screenhand 0.1.1 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (241) hide show
  1. package/README.md +193 -109
  2. package/bin/darwin-arm64/macos-bridge +0 -0
  3. package/dist/mcp-desktop.js +5876 -0
  4. package/dist/scripts/codex-monitor-daemon.js +335 -0
  5. package/dist/scripts/export-help-center.js +112 -0
  6. package/dist/scripts/marketing-loop.js +117 -0
  7. package/dist/scripts/observer-daemon.js +288 -0
  8. package/dist/scripts/orchestrator-daemon.js +399 -0
  9. package/dist/scripts/supervisor-daemon.js +272 -0
  10. package/dist/scripts/threads-campaign.js +208 -0
  11. package/dist/scripts/worker-daemon.js +228 -0
  12. package/dist/src/agent/cli.js +82 -0
  13. package/dist/src/agent/loop.js +274 -0
  14. package/dist/src/community/fetcher.js +109 -0
  15. package/dist/src/community/index.js +6 -0
  16. package/dist/src/community/publisher.js +191 -0
  17. package/dist/src/community/remote-api.js +121 -0
  18. package/dist/src/community/types.js +3 -0
  19. package/dist/src/community/validator.js +95 -0
  20. package/{src/config.ts → dist/src/config.js} +5 -10
  21. package/dist/src/context-tracker.js +489 -0
  22. package/{src/index.ts → dist/src/index.js} +32 -52
  23. package/dist/src/ingestion/coverage-auditor.js +233 -0
  24. package/dist/src/ingestion/doc-parser.js +164 -0
  25. package/dist/src/ingestion/index.js +8 -0
  26. package/dist/src/ingestion/menu-scanner.js +152 -0
  27. package/dist/src/ingestion/reference-merger.js +186 -0
  28. package/dist/src/ingestion/shortcut-extractor.js +180 -0
  29. package/dist/src/ingestion/tutorial-extractor.js +170 -0
  30. package/dist/src/ingestion/types.js +3 -0
  31. package/dist/src/jobs/manager.js +305 -0
  32. package/dist/src/jobs/runner.js +806 -0
  33. package/dist/src/jobs/store.js +102 -0
  34. package/dist/src/jobs/types.js +30 -0
  35. package/dist/src/jobs/worker.js +97 -0
  36. package/dist/src/learning/engine.js +356 -0
  37. package/dist/src/learning/index.js +9 -0
  38. package/dist/src/learning/locator-policy.js +120 -0
  39. package/dist/src/learning/pattern-policy.js +89 -0
  40. package/dist/src/learning/recovery-policy.js +116 -0
  41. package/dist/src/learning/sensor-policy.js +115 -0
  42. package/dist/src/learning/timing-model.js +204 -0
  43. package/dist/src/learning/topology-policy.js +90 -0
  44. package/dist/src/learning/types.js +9 -0
  45. package/dist/src/logging/timeline-logger.js +48 -0
  46. package/dist/src/mcp/mcp-stdio-server.js +464 -0
  47. package/dist/src/mcp/server.js +363 -0
  48. package/dist/src/mcp-entry.js +60 -0
  49. package/dist/src/memory/playbook-seeds.js +200 -0
  50. package/dist/src/memory/recall.js +222 -0
  51. package/dist/src/memory/research.js +104 -0
  52. package/dist/src/memory/seeds.js +101 -0
  53. package/dist/src/memory/service.js +446 -0
  54. package/dist/src/memory/session.js +169 -0
  55. package/dist/src/memory/store.js +451 -0
  56. package/{src/runtime/locator-cache.ts → dist/src/memory/types.js} +1 -17
  57. package/dist/src/monitor/codex-monitor.js +382 -0
  58. package/dist/src/monitor/task-queue.js +97 -0
  59. package/dist/src/monitor/types.js +62 -0
  60. package/dist/src/native/bridge-client.js +412 -0
  61. package/{src/native/macos-bridge-client.ts → dist/src/native/macos-bridge-client.js} +0 -1
  62. package/dist/src/observer/state.js +199 -0
  63. package/dist/src/observer/types.js +43 -0
  64. package/dist/src/orchestrator/state.js +68 -0
  65. package/dist/src/orchestrator/types.js +22 -0
  66. package/dist/src/perception/ax-source.js +162 -0
  67. package/dist/src/perception/cdp-source.js +162 -0
  68. package/dist/src/perception/coordinator.js +771 -0
  69. package/dist/src/perception/frame-differ.js +287 -0
  70. package/dist/src/perception/index.js +22 -0
  71. package/dist/src/perception/manager.js +199 -0
  72. package/dist/src/perception/types.js +47 -0
  73. package/dist/src/perception/vision-source.js +399 -0
  74. package/dist/src/planner/deterministic.js +298 -0
  75. package/dist/src/planner/executor.js +870 -0
  76. package/dist/src/planner/goal-store.js +92 -0
  77. package/dist/src/planner/index.js +21 -0
  78. package/dist/src/planner/planner.js +520 -0
  79. package/dist/src/planner/tool-registry.js +71 -0
  80. package/dist/src/planner/types.js +22 -0
  81. package/dist/src/platform/explorer.js +213 -0
  82. package/dist/src/platform/help-center-markdown.js +527 -0
  83. package/dist/src/platform/learner.js +257 -0
  84. package/dist/src/playbook/engine.js +486 -0
  85. package/dist/src/playbook/index.js +20 -0
  86. package/dist/src/playbook/mcp-recorder.js +204 -0
  87. package/dist/src/playbook/recorder.js +536 -0
  88. package/dist/src/playbook/runner.js +408 -0
  89. package/dist/src/playbook/store.js +312 -0
  90. package/dist/src/playbook/types.js +17 -0
  91. package/dist/src/recovery/detectors.js +156 -0
  92. package/dist/src/recovery/engine.js +327 -0
  93. package/dist/src/recovery/index.js +20 -0
  94. package/dist/src/recovery/strategies.js +274 -0
  95. package/dist/src/recovery/types.js +20 -0
  96. package/dist/src/runtime/accessibility-adapter.js +430 -0
  97. package/dist/src/runtime/app-adapter.js +64 -0
  98. package/dist/src/runtime/applescript-adapter.js +305 -0
  99. package/dist/src/runtime/ax-role-map.js +96 -0
  100. package/dist/src/runtime/browser-adapter.js +52 -0
  101. package/dist/src/runtime/cdp-chrome-adapter.js +521 -0
  102. package/dist/src/runtime/composite-adapter.js +221 -0
  103. package/dist/src/runtime/execution-contract.js +159 -0
  104. package/dist/src/runtime/executor.js +286 -0
  105. package/dist/src/runtime/locator-cache.js +50 -0
  106. package/dist/src/runtime/planning-loop.js +63 -0
  107. package/dist/src/runtime/service.js +432 -0
  108. package/dist/src/runtime/session-manager.js +63 -0
  109. package/dist/src/runtime/state-observer.js +121 -0
  110. package/dist/src/runtime/vision-adapter.js +225 -0
  111. package/dist/src/state/app-map-types.js +72 -0
  112. package/dist/src/state/app-map.js +1974 -0
  113. package/dist/src/state/entity-tracker.js +108 -0
  114. package/dist/src/state/fusion.js +96 -0
  115. package/dist/src/state/index.js +21 -0
  116. package/dist/src/state/ladder-generator.js +236 -0
  117. package/dist/src/state/persistence.js +156 -0
  118. package/dist/src/state/types.js +17 -0
  119. package/dist/src/state/world-model.js +1456 -0
  120. package/dist/src/supervisor/locks.js +186 -0
  121. package/dist/src/supervisor/supervisor.js +403 -0
  122. package/dist/src/supervisor/types.js +30 -0
  123. package/dist/src/test-mcp-protocol.js +154 -0
  124. package/dist/src/types.js +17 -0
  125. package/dist/src/util/atomic-write.js +133 -0
  126. package/dist/src/util/sanitize.js +146 -0
  127. package/dist-app-maps/com.figma.Desktop.json +959 -0
  128. package/dist-app-maps/com.hnc.Discord.json +1146 -0
  129. package/dist-app-maps/notion.id.json +2831 -0
  130. package/dist-playbooks/canva-screenhand-carousel.json +445 -0
  131. package/dist-playbooks/codex-desktop.json +76 -0
  132. package/dist-playbooks/competitor-research-stack.json +122 -0
  133. package/dist-playbooks/davinci-color-grade.json +153 -0
  134. package/dist-playbooks/davinci-edit-timeline.json +162 -0
  135. package/dist-playbooks/davinci-render.json +114 -0
  136. package/dist-playbooks/devto.json +52 -0
  137. package/dist-playbooks/discord.json +41 -0
  138. package/dist-playbooks/google-flow-create-project.json +59 -0
  139. package/dist-playbooks/google-flow-edit-image.json +90 -0
  140. package/dist-playbooks/google-flow-edit-video.json +90 -0
  141. package/dist-playbooks/google-flow-generate-image.json +68 -0
  142. package/dist-playbooks/google-flow-generate-video.json +191 -0
  143. package/dist-playbooks/google-flow-open-project.json +48 -0
  144. package/dist-playbooks/google-flow-open-scenebuilder.json +64 -0
  145. package/dist-playbooks/google-flow-search-assets.json +64 -0
  146. package/dist-playbooks/instagram.json +57 -0
  147. package/dist-playbooks/linkedin.json +52 -0
  148. package/dist-playbooks/n8n.json +43 -0
  149. package/dist-playbooks/reddit.json +52 -0
  150. package/dist-playbooks/threads.json +59 -0
  151. package/dist-playbooks/x-twitter.json +59 -0
  152. package/dist-playbooks/youtube.json +59 -0
  153. package/dist-references/canva.json +646 -0
  154. package/dist-references/codex-desktop.json +305 -0
  155. package/dist-references/davinci-resolve-keyboard.json +594 -0
  156. package/dist-references/davinci-resolve-menu-map.json +1139 -0
  157. package/dist-references/davinci-resolve-menus-batch1.json +116 -0
  158. package/dist-references/davinci-resolve-menus-batch2.json +372 -0
  159. package/dist-references/davinci-resolve-menus-batch3.json +330 -0
  160. package/dist-references/davinci-resolve-menus-batch4.json +297 -0
  161. package/dist-references/davinci-resolve-shortcuts.json +333 -0
  162. package/dist-references/devto.json +317 -0
  163. package/dist-references/discord.json +549 -0
  164. package/dist-references/figma.json +1186 -0
  165. package/dist-references/finder.json +146 -0
  166. package/dist-references/google-ads-transparency.json +95 -0
  167. package/dist-references/google-flow.json +649 -0
  168. package/dist-references/instagram.json +341 -0
  169. package/dist-references/linkedin.json +324 -0
  170. package/dist-references/meta-ad-library.json +86 -0
  171. package/dist-references/n8n.json +387 -0
  172. package/dist-references/notes.json +27 -0
  173. package/dist-references/notion.json +163 -0
  174. package/dist-references/reddit.json +341 -0
  175. package/dist-references/threads.json +337 -0
  176. package/dist-references/x-twitter.json +403 -0
  177. package/dist-references/youtube.json +373 -0
  178. package/native/macos-bridge/Package.swift +1 -0
  179. package/native/macos-bridge/Sources/AccessibilityBridge.swift +257 -36
  180. package/native/macos-bridge/Sources/AppManagement.swift +212 -2
  181. package/native/macos-bridge/Sources/CoreGraphicsBridge.swift +348 -53
  182. package/native/macos-bridge/Sources/StreamCapture.swift +136 -0
  183. package/native/macos-bridge/Sources/VisionBridge.swift +165 -7
  184. package/native/macos-bridge/Sources/main.swift +169 -16
  185. package/native/windows-bridge/Program.cs +5 -0
  186. package/native/windows-bridge/ScreenCapture.cs +124 -0
  187. package/package.json +29 -4
  188. package/scripts/postinstall.cjs +127 -0
  189. package/.claude/commands/automate.md +0 -28
  190. package/.claude/commands/debug-ui.md +0 -19
  191. package/.claude/commands/screenshot.md +0 -15
  192. package/.github/FUNDING.yml +0 -1
  193. package/.github/ISSUE_TEMPLATE/bug_report.md +0 -27
  194. package/.github/ISSUE_TEMPLATE/feature_request.md +0 -20
  195. package/.mcp.json +0 -8
  196. package/DESKTOP_MCP_GUIDE.md +0 -92
  197. package/SECURITY.md +0 -44
  198. package/docs/architecture.md +0 -47
  199. package/install-skills.sh +0 -19
  200. package/mcp-bridge.ts +0 -271
  201. package/mcp-desktop.ts +0 -1221
  202. package/playbooks/instagram.json +0 -41
  203. package/playbooks/instagram_v2.json +0 -201
  204. package/playbooks/x_v1.json +0 -211
  205. package/scripts/devpost-live-loop.mjs +0 -421
  206. package/src/logging/timeline-logger.ts +0 -55
  207. package/src/mcp/server.ts +0 -449
  208. package/src/memory/recall.ts +0 -191
  209. package/src/memory/research.ts +0 -146
  210. package/src/memory/seeds.ts +0 -123
  211. package/src/memory/session.ts +0 -201
  212. package/src/memory/store.ts +0 -434
  213. package/src/memory/types.ts +0 -69
  214. package/src/native/bridge-client.ts +0 -239
  215. package/src/runtime/accessibility-adapter.ts +0 -487
  216. package/src/runtime/app-adapter.ts +0 -169
  217. package/src/runtime/applescript-adapter.ts +0 -376
  218. package/src/runtime/ax-role-map.ts +0 -102
  219. package/src/runtime/browser-adapter.ts +0 -129
  220. package/src/runtime/cdp-chrome-adapter.ts +0 -676
  221. package/src/runtime/composite-adapter.ts +0 -274
  222. package/src/runtime/executor.ts +0 -396
  223. package/src/runtime/planning-loop.ts +0 -81
  224. package/src/runtime/service.ts +0 -448
  225. package/src/runtime/session-manager.ts +0 -50
  226. package/src/runtime/state-observer.ts +0 -136
  227. package/src/runtime/vision-adapter.ts +0 -297
  228. package/src/types.ts +0 -297
  229. package/tests/bridge-client.test.ts +0 -176
  230. package/tests/browser-stealth.test.ts +0 -210
  231. package/tests/composite-adapter.test.ts +0 -64
  232. package/tests/mcp-server.test.ts +0 -151
  233. package/tests/memory-recall.test.ts +0 -339
  234. package/tests/memory-research.test.ts +0 -159
  235. package/tests/memory-seeds.test.ts +0 -120
  236. package/tests/memory-store.test.ts +0 -392
  237. package/tests/types.test.ts +0 -92
  238. package/tsconfig.check.json +0 -17
  239. package/tsconfig.json +0 -19
  240. package/vitest.config.ts +0 -8
  241. /package/{playbooks → dist-references}/devpost.json +0 -0
@@ -0,0 +1,305 @@
1
+ // Copyright (C) 2025 Clazro Technology Private Limited
2
+ // SPDX-License-Identifier: AGPL-3.0-only
3
+ //
4
+ // This file is part of ScreenHand.
5
+ //
6
+ // ScreenHand is free software: you can redistribute it and/or modify
7
+ // it under the terms of the GNU Affero General Public License as
8
+ // published by the Free Software Foundation, version 3.
9
+ //
10
+ // ScreenHand is distributed in the hope that it will be useful,
11
+ // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
+ // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
+ // GNU Affero General Public License for more details.
14
+ //
15
+ // You should have received a copy of the GNU Affero General Public License
16
+ // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
+ import { execFile } from "node:child_process";
18
+ import { randomUUID } from "node:crypto";
19
+ import { promisify } from "node:util";
20
/** Promise-returning wrapper around `child_process.execFile`. */
const execFileAsync = promisify(execFile);
/** Delay between polling attempts, in milliseconds. */
const POLL_INTERVAL_MS = 100;
/**
 * Apps known to have AppleScript scripting dictionaries, keyed by bundle ID
 * and mapped to the application name used in `tell application "<name>"`.
 *
 * The table has a null prototype and is frozen: bundle IDs come from callers
 * (for example out of `app://<bundleId>` URLs), so a lookup such as
 * `"constructor" in SCRIPTABLE_APPS` or `SCRIPTABLE_APPS["toString"]` must
 * not resolve to a member inherited from `Object.prototype`.
 */
const SCRIPTABLE_APPS = Object.freeze(Object.assign(Object.create(null), {
    "com.apple.finder": "Finder",
    "com.apple.Safari": "Safari",
    "com.apple.mail": "Mail",
    "com.apple.iWork.Pages": "Pages",
    "com.apple.iWork.Keynote": "Keynote",
    "com.apple.iWork.Numbers": "Numbers",
    "com.apple.Notes": "Notes",
    "com.apple.reminders": "Reminders",
    "com.apple.iCal": "Calendar",
    "com.apple.TextEdit": "TextEdit",
    "com.apple.Preview": "Preview",
    "com.apple.systempreferences": "System Preferences",
    "com.apple.Terminal": "Terminal",
    "com.apple.Music": "Music",
    "com.apple.TV": "TV",
    "com.apple.Podcasts": "Podcasts",
}));
41
/**
 * Adapter that automates macOS applications by generating AppleScript and
 * running it through `osascript`.
 *
 * Sessions live in memory and are indexed both by session id and by profile.
 * Each session records the application (display name and bundle ID) it is
 * currently targeting and starts out pointing at Finder.
 *
 * Every caller-supplied value that ends up inside an AppleScript string
 * literal (app names, bundle IDs, labels, URLs, menu titles) is passed through
 * `escapeAS` so it cannot terminate the literal and inject script.
 */
export class AppleScriptAdapter {
    /**
     * macOS virtual key codes for keys that have a name rather than a
     * character. `keystroke "enter"` would type the five letters, so these are
     * sent with `key code` instead.
     */
    static #NAMED_KEY_CODES = new Map([
        ["return", 36],
        ["enter", 36],
        ["tab", 48],
        ["space", 49],
        ["delete", 51],
        ["backspace", 51],
        ["escape", 53],
        ["esc", 53],
        ["left", 123],
        ["right", 124],
        ["down", 125],
        ["up", 126],
    ]);
    /** Session state keyed by session id. */
    sessions = new Map();
    /** Session state keyed by profile (same state objects as `sessions`). */
    sessionsByProfile = new Map();

    /**
     * Check if a bundle ID is listed in the table of scriptable apps.
     * Only own keys count, so names such as "constructor" are not scriptable.
     * @param {string} bundleId
     * @returns {boolean}
     */
    static isScriptable(bundleId) {
        return Object.hasOwn(SCRIPTABLE_APPS, bundleId);
    }

    /**
     * Create a session for `profile`, or return the one that already exists.
     * When a session already exists for the profile it is returned as-is and
     * `reuseSessionId` is ignored.
     * @param {string} profile
     * @param {string} [reuseSessionId] Session id to use instead of a generated one.
     * @returns {Promise<object>} Session info (`sessionId`, `profile`, `createdAt`, `adapterType`).
     */
    async attach(profile, reuseSessionId) {
        const existing = this.sessionsByProfile.get(profile);
        if (existing) {
            return existing.info;
        }
        const info = {
            sessionId: reuseSessionId ?? `as_session_${profile}_${Date.now()}_${randomUUID().slice(0, 8)}`,
            profile,
            createdAt: new Date().toISOString(),
            adapterType: "applescript",
        };
        // New sessions target Finder until navigate/launchApp/focusApp changes it.
        const state = {
            info,
            appName: "Finder",
            bundleId: "com.apple.finder",
        };
        this.sessions.set(info.sessionId, state);
        this.sessionsByProfile.set(profile, state);
        return info;
    }

    /**
     * Describe the app the session currently targets.
     * Both lookups are best-effort: a failed title query falls back to the app
     * name and a failed pid query falls back to 0.
     * @param {string} sessionId
     * @returns {Promise<{bundleId: string, appName: string, pid: number, windowTitle: string}>}
     * @throws {Error} If the session does not exist.
     */
    async getAppContext(sessionId) {
        const state = this.requireSession(sessionId);
        const appName = this.escapeAS(state.appName);
        const bundleId = this.escapeAS(state.bundleId);
        // The two queries are independent, so run them concurrently.
        const [windowTitle, pidStr] = await Promise.all([
            this.runScript(`tell application "${appName}" to get name of front window`).catch(() => state.appName),
            this.runScript(`tell application "System Events" to get unix id of (first process whose bundle identifier is "${bundleId}")`).catch(() => "0"),
        ]);
        return {
            bundleId: state.bundleId,
            appName: state.appName,
            pid: Number.parseInt(pidStr, 10) || 0,
            windowTitle,
        };
    }

    /**
     * Return a URL/title pair for the session's app. The URL is
     * `app://<bundleId>` except for Safari, where the front tab's URL is used
     * when it can be read.
     * @param {string} sessionId
     * @returns {Promise<{url: string, title: string}>}
     */
    async getPageMeta(sessionId) {
        const ctx = await this.getAppContext(sessionId);
        let url = `app://${ctx.bundleId}`;
        if (ctx.bundleId === "com.apple.Safari") {
            try {
                url = await this.runScript('tell application "Safari" to get URL of current tab of front window');
            }
            catch {
                // Best-effort: keep the app:// URL when Safari has no readable tab.
            }
        }
        return { url, title: ctx.windowTitle };
    }

    /**
     * Navigate the session.
     * - `app://<bundleId>` activates that app and retargets the session.
     * - Otherwise, a Safari session loads `url` in the front tab and a Finder
     *   session opens `url` as a POSIX path. Other sessions do nothing.
     * @param {string} sessionId
     * @param {string} url
     * @param {number} [_timeoutMs] Unused.
     * @returns {Promise<{url: string, title: string}>} Page meta after navigating.
     */
    async navigate(sessionId, url, _timeoutMs) {
        const state = this.requireSession(sessionId);
        if (url.startsWith("app://")) {
            const bundleId = url.slice("app://".length);
            const appName = this.resolveAppName(bundleId);
            await this.runScript(`tell application "${this.escapeAS(appName)}" to activate`);
            // Retarget only after activation succeeded (same order as launchApp),
            // so a failed activation does not leave the session on a dead app.
            state.bundleId = bundleId;
            state.appName = appName;
        }
        else if (state.bundleId === "com.apple.Safari") {
            await this.runScript(`tell application "Safari" to set URL of current tab of front window to "${this.escapeAS(url)}"`);
        }
        else if (state.bundleId === "com.apple.finder") {
            await this.runScript(`tell application "Finder" to open POSIX file "${this.escapeAS(url)}"`);
        }
        return this.getPageMeta(sessionId);
    }

    /**
     * Poll the front window for a UI element matching `target` until it is
     * found or `timeoutMs` elapses.
     * @param {string} sessionId
     * @param {object} target `{type: "text", value}`, `{type: "role", name}` or `{type: "selector", value}`.
     * @param {number} timeoutMs
     * @returns {Promise<{handleId: string, locatorUsed: string, label: string} | null>}
     *   The match, or null on timeout or when the target cannot be expressed.
     */
    async locate(sessionId, target, timeoutMs) {
        const state = this.requireSession(sessionId);
        let script;
        try {
            // The script does not change between attempts, so build it once.
            script = this.buildLocateScript(state, target);
        }
        catch {
            // An unsupported or malformed target can never match; polling
            // until the deadline would only delay the same null result.
            return null;
        }
        const deadline = Date.now() + timeoutMs;
        while (Date.now() < deadline) {
            try {
                const result = await this.runScript(script);
                if (result && result !== "missing value") {
                    return {
                        handleId: `as_${result.replace(/\s+/g, "_").slice(0, 50)}`,
                        locatorUsed: `applescript:${target.type}`,
                        label: result,
                    };
                }
            }
            catch {
                // Not found yet — osascript fails while nothing matches.
            }
            await sleep(POLL_INTERVAL_MS);
        }
        return null;
    }

    /**
     * Click the button of the front window named after the element's label
     * (or its handle id when it has no label).
     * @param {string} sessionId
     * @param {{label?: string, handleId: string}} element
     */
    async click(sessionId, element) {
        const state = this.requireSession(sessionId);
        const button = this.escapeAS(element.label ?? element.handleId);
        await this.runScript(`tell application "System Events" to tell process "${this.escapeAS(state.appName)}" to click button "${button}" of front window`);
    }

    /**
     * Set the value of the front window's text field named by the element label.
     * @param {string} sessionId
     * @param {{label?: string}} element
     * @param {string} text
     * @param {boolean} [_clear] Unused.
     */
    async setValue(sessionId, element, text, _clear) {
        const state = this.requireSession(sessionId);
        const field = this.escapeAS(element.label ?? "");
        await this.runScript(`tell application "System Events" to tell process "${this.escapeAS(state.appName)}" to set value of text field "${field}" of front window to "${this.escapeAS(text)}"`);
    }

    /**
     * Read the value of the front window's text field named by the element label.
     * @param {string} sessionId
     * @param {{label?: string}} element
     * @returns {Promise<string>}
     */
    async getValue(sessionId, element) {
        const state = this.requireSession(sessionId);
        const field = this.escapeAS(element.label ?? "");
        return this.runScript(`tell application "System Events" to tell process "${this.escapeAS(state.appName)}" to get value of text field "${field}" of front window`);
    }

    /**
     * Poll until `condition` holds or `timeoutMs` elapses.
     * Handles `text_appears` (uses `locate`) and `window_title_matches`
     * (tests `condition.regex` against the front window title). Errors raised
     * while checking are treated as "not yet".
     * @param {string} sessionId
     * @param {object} condition
     * @param {number} timeoutMs
     * @returns {Promise<boolean>} True when the condition was observed, false on timeout.
     */
    async waitFor(sessionId, condition, timeoutMs) {
        const deadline = Date.now() + timeoutMs;
        while (Date.now() < deadline) {
            try {
                if (condition.type === "text_appears") {
                    const found = await this.locate(sessionId, { type: "text", value: condition.text }, 200);
                    if (found) {
                        return true;
                    }
                }
                else if (condition.type === "window_title_matches") {
                    const ctx = await this.getAppContext(sessionId);
                    if (new RegExp(condition.regex).test(ctx.windowTitle)) {
                        return true;
                    }
                }
            }
            catch {
                // Keep trying until the deadline.
            }
            await sleep(POLL_INTERVAL_MS);
        }
        return false;
    }

    /**
     * Extract data from the session's app.
     * For a Finder session with `format === "json"` this lists the names of
     * the items in the front window's folder; otherwise it locates `target`
     * and returns its label.
     * @param {string} sessionId
     * @param {object} target
     * @param {string} format
     * @returns {Promise<{items: string[]} | string>}
     * @throws {Error} If the generic target cannot be located.
     */
    async extract(sessionId, target, format) {
        const state = this.requireSession(sessionId);
        if (state.bundleId === "com.apple.finder" && format === "json") {
            const result = await this.runScript('tell application "Finder" to get name of every item of (target of front window) as list');
            // An empty folder prints nothing; "".split(", ") would yield [""].
            return { items: result === "" ? [] : result.split(", ") };
        }
        const element = await this.locate(sessionId, target, 1500);
        if (!element) {
            throw new Error("Extract target not found");
        }
        return element.label ?? "";
    }

    /**
     * Capture the screen to a PNG under /tmp and return its path.
     * Both parameters are unused: the capture is not limited to a session or region.
     * @param {string} [_sessionId]
     * @param {object} [_region]
     * @returns {Promise<string>} Path of the written file.
     */
    async screenshot(_sessionId, _region) {
        const path = `/tmp/as_screenshot_${Date.now()}.png`;
        await this.runScript(`do shell script "screencapture -x '${path}'"`);
        return path;
    }

    // ── Desktop methods ──

    /**
     * Activate an app and retarget the session to it.
     * @param {string} sessionId
     * @param {string} bundleId
     * @returns {Promise<object>} App context after launching.
     */
    async launchApp(sessionId, bundleId) {
        const state = this.requireSession(sessionId);
        const appName = this.resolveAppName(bundleId);
        await this.runScript(`tell application "${this.escapeAS(appName)}" to activate`);
        state.bundleId = bundleId;
        state.appName = appName;
        return this.getAppContext(sessionId);
    }

    /**
     * Bring an app to the front and retarget the session to it.
     * @param {string} sessionId
     * @param {string} bundleId
     */
    async focusApp(sessionId, bundleId) {
        // Validate the session first so an unknown session has no side effect.
        const state = this.requireSession(sessionId);
        const appName = this.resolveAppName(bundleId);
        await this.runScript(`tell application "${this.escapeAS(appName)}" to activate`);
        state.bundleId = bundleId;
        state.appName = appName;
    }

    /**
     * List foreground application processes.
     * @param {string} [_sessionId] Unused.
     * @returns {Promise<Array<{bundleId: string, name: string, pid: number, isActive: boolean}>>}
     */
    async listApps(_sessionId) {
        const result = await this.runScript('tell application "System Events" to get {bundle identifier, name, unix id, frontmost} of every application process whose background only is false');
        // osascript prints the four property lists flattened one after another:
        // all bundle ids, then all names, then all pids, then all frontmost flags.
        // NOTE(review): a value that itself contains ", " shifts the columns.
        const parts = result.split(", ");
        const count = Math.floor(parts.length / 4);
        const apps = [];
        for (let i = 0; i < count; i++) {
            apps.push({
                bundleId: parts[i] ?? "unknown",
                name: parts[count + i] ?? "Unknown",
                // Fall back to 0 (as getAppContext does) instead of NaN.
                pid: Number.parseInt(parts[2 * count + i] ?? "0", 10) || 0,
                isActive: parts[3 * count + i] === "true",
            });
        }
        return apps;
    }

    /**
     * Describe the windows of the frontmost process.
     * Simplified: the raw osascript output (names, positions, sizes) is
     * returned as the title of a single placeholder entry with zeroed bounds.
     * @param {string} [_sessionId] Unused.
     * @returns {Promise<Array<object>>}
     */
    async listWindows(_sessionId) {
        const result = await this.runScript('tell application "System Events" to get {name, position, size} of every window of (first process whose frontmost is true)');
        return [{
                windowId: 0,
                title: result,
                bundleId: "",
                pid: 0,
                bounds: { x: 0, y: 0, width: 0, height: 0 },
                isOnScreen: true,
            }];
    }

    /**
     * Click a menu entry of the session's app.
     * @param {string} sessionId
     * @param {string[]} menuPath Titles from the menu bar down, e.g. `["File", "Export", "PDF"]`.
     * @throws {Error} If `menuPath` is empty or the session does not exist.
     */
    async menuClick(sessionId, menuPath) {
        const state = this.requireSession(sessionId);
        if (menuPath.length === 0) {
            throw new Error("menuPath must not be empty");
        }
        let target;
        if (menuPath.length === 1) {
            // Direct children of a menu bar are "menu bar item"s, not "menu item"s.
            target = `menu bar item "${this.escapeAS(menuPath[0])}"`;
        }
        else {
            const last = menuPath.length - 1;
            target = `menu item "${this.escapeAS(menuPath[last])}" of menu "${this.escapeAS(menuPath[last - 1])}"`;
            // Walk back up the path: submenu `menuPath[i + 1]` belongs to the
            // menu item of the same title inside menu `menuPath[i]`.
            for (let i = last - 2; i >= 0; i--) {
                target += ` of menu item "${this.escapeAS(menuPath[i + 1])}" of menu "${this.escapeAS(menuPath[i])}"`;
            }
        }
        const script = `tell application "System Events" to tell process "${this.escapeAS(state.appName)}"\n` +
            `  click ${target} of menu bar 1\n` +
            `end tell`;
        await this.runScript(script);
    }

    /**
     * Send a key combination through System Events.
     * Modifier names (cmd/command, shift, alt/option, ctrl/control) become a
     * `using {...}` clause; the last remaining entry is the key. Named keys
     * (enter, tab, space, delete, escape, arrows) are sent as key codes, any
     * other key is typed with `keystroke`.
     * @param {string} [_sessionId] Unused.
     * @param {string[]} keys
     */
    async keyCombo(_sessionId, keys) {
        const modifiers = [];
        let keyChar = "";
        for (const key of keys) {
            const lower = key.toLowerCase();
            if (lower === "cmd" || lower === "command") {
                modifiers.push("command down");
            }
            else if (lower === "shift") {
                modifiers.push("shift down");
            }
            else if (lower === "alt" || lower === "option") {
                modifiers.push("option down");
            }
            else if (lower === "ctrl" || lower === "control") {
                modifiers.push("control down");
            }
            else {
                keyChar = lower;
            }
        }
        const modStr = modifiers.length > 0 ? ` using {${modifiers.join(", ")}}` : "";
        const keyCode = AppleScriptAdapter.#NAMED_KEY_CODES.get(keyChar);
        const action = keyCode !== undefined
            ? `key code ${keyCode}`
            : `keystroke "${this.escapeAS(keyChar)}"`;
        await this.runScript(`tell application "System Events" to ${action}${modStr}`);
    }

    // ── Private helpers ──

    /**
     * Look up a session's state.
     * @param {string} sessionId
     * @returns {object}
     * @throws {Error} If no session has that id.
     */
    requireSession(sessionId) {
        const state = this.sessions.get(sessionId);
        if (!state) {
            throw new Error(`Session not found: ${sessionId}`);
        }
        return state;
    }

    /**
     * Map a bundle ID to the application name used in `tell application`.
     * Unknown IDs are used verbatim; only own keys of the table are consulted.
     * @param {string} bundleId
     * @returns {string}
     */
    resolveAppName(bundleId) {
        return Object.hasOwn(SCRIPTABLE_APPS, bundleId) ? SCRIPTABLE_APPS[bundleId] : bundleId;
    }

    /**
     * Run an AppleScript with `osascript -e` (10 s timeout).
     * @param {string} script
     * @returns {Promise<string>} Trimmed stdout.
     */
    async runScript(script) {
        const { stdout } = await execFileAsync("osascript", ["-e", script], {
            timeout: 10_000,
        });
        return stdout.trim();
    }

    /**
     * Build the System Events query used by `locate`.
     * `text` and `role` targets match on element name, `selector` targets on
     * element description.
     * @param {object} state Session state.
     * @param {object} target
     * @returns {string}
     * @throws {Error} For any other target type.
     */
    buildLocateScript(state, target) {
        const proc = this.escapeAS(state.appName);
        if (target.type === "text" || target.type === "role") {
            const searchText = target.type === "text" ? target.value : target.name;
            return `tell application "System Events" to tell process "${proc}" to get name of first UI element of front window whose name contains "${this.escapeAS(searchText)}"`;
        }
        if (target.type === "selector") {
            return `tell application "System Events" to tell process "${proc}" to get name of first UI element of front window whose description contains "${this.escapeAS(target.value)}"`;
        }
        throw new Error(`AppleScript adapter does not support target type: ${target.type}`);
    }

    /**
     * Escape a string for use inside an AppleScript double-quoted literal.
     * Backslashes are escaped first so the escapes added afterwards are not
     * doubled; NUL characters are dropped.
     * @param {string} str
     * @returns {string}
     */
    escapeAS(str) {
        return str
            .replace(/\\/g, "\\\\")
            .replace(/"/g, '\\"')
            .replace(/\n/g, "\\n")
            .replace(/\r/g, "\\r")
            .replace(/\0/g, "");
    }
}
303
/**
 * Resolve after roughly `ms` milliseconds.
 * @param {number} ms Delay handed to `setTimeout`.
 * @returns {Promise<void>}
 */
function sleep(ms) {
    return new Promise((done) => {
        setTimeout(done, ms);
    });
}
@@ -0,0 +1,96 @@
1
+ // Copyright (C) 2025 Clazro Technology Private Limited
2
+ // SPDX-License-Identifier: AGPL-3.0-only
3
+ //
4
+ // This file is part of ScreenHand.
5
+ //
6
+ // ScreenHand is free software: you can redistribute it and/or modify
7
+ // it under the terms of the GNU Affero General Public License as
8
+ // published by the Free Software Foundation, version 3.
9
+ //
10
+ // ScreenHand is distributed in the hope that it will be useful,
11
+ // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
+ // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
+ // GNU Affero General Public License for more details.
14
+ //
15
+ // You should have received a copy of the GNU Affero General Public License
16
+ // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
+ /**
18
+ * Maps web ARIA roles to macOS Accessibility roles.
19
+ * Used to translate web-style role targets to native AX queries.
20
+ */
21
+ export const WEB_TO_AX_ROLE = {
22
+ // Interactive
23
+ button: "AXButton",
24
+ link: "AXLink",
25
+ textbox: "AXTextField",
26
+ checkbox: "AXCheckBox",
27
+ radio: "AXRadioButton",
28
+ combobox: "AXComboBox",
29
+ slider: "AXSlider",
30
+ switch: "AXCheckBox",
31
+ tab: "AXRadioButton",
32
+ menuitem: "AXMenuItem",
33
+ menu: "AXMenu",
34
+ menubar: "AXMenuBar",
35
+ option: "AXMenuItem",
36
+ listbox: "AXList",
37
+ spinbutton: "AXIncrementor",
38
+ scrollbar: "AXScrollBar",
39
+ // Structure
40
+ heading: "AXHeading",
41
+ list: "AXList",
42
+ listitem: "AXGroup",
43
+ table: "AXTable",
44
+ row: "AXRow",
45
+ cell: "AXCell",
46
+ grid: "AXTable",
47
+ treegrid: "AXOutline",
48
+ tree: "AXOutline",
49
+ treeitem: "AXOutlineRow",
50
+ toolbar: "AXToolbar",
51
+ tablist: "AXTabGroup",
52
+ tabpanel: "AXGroup",
53
+ group: "AXGroup",
54
+ region: "AXGroup",
55
+ dialog: "AXSheet",
56
+ alertdialog: "AXSheet",
57
+ // Semantic
58
+ img: "AXImage",
59
+ image: "AXImage",
60
+ progressbar: "AXProgressIndicator",
61
+ separator: "AXSplitter",
62
+ status: "AXStaticText",
63
+ tooltip: "AXHelpTag",
64
+ banner: "AXGroup",
65
+ navigation: "AXGroup",
66
+ main: "AXGroup",
67
+ contentinfo: "AXGroup",
68
+ complementary: "AXGroup",
69
+ article: "AXGroup",
70
+ document: "AXGroup",
71
+ // Text
72
+ statictext: "AXStaticText",
73
+ textarea: "AXTextArea",
74
+ text: "AXStaticText",
75
+ // Window-level
76
+ window: "AXWindow",
77
+ application: "AXApplication",
78
+ };
79
+ /**
80
+ * Maps macOS AX roles back to web ARIA roles.
81
+ */
82
+ export const AX_TO_WEB_ROLE = {};
83
+ for (const [web, ax] of Object.entries(WEB_TO_AX_ROLE)) {
84
+ if (!(ax in AX_TO_WEB_ROLE)) {
85
+ AX_TO_WEB_ROLE[ax] = web;
86
+ }
87
+ }
88
+ /**
89
+ * Convert a web-style role to macOS AX role.
90
+ * If already an AX role (starts with "AX"), pass through.
91
+ */
92
+ export function toAXRole(role) {
93
+ if (role.startsWith("AX"))
94
+ return role;
95
+ return WEB_TO_AX_ROLE[role.toLowerCase()] ?? role;
96
+ }
@@ -0,0 +1,52 @@
1
+ // Copyright (C) 2025 Clazro Technology Private Limited
2
+ // SPDX-License-Identifier: AGPL-3.0-only
3
+ //
4
+ // This file is part of ScreenHand.
5
+ //
6
+ // ScreenHand is free software: you can redistribute it and/or modify
7
+ // it under the terms of the GNU Affero General Public License as
8
+ // published by the Free Software Foundation, version 3.
9
+ //
10
+ // ScreenHand is distributed in the hope that it will be useful,
11
+ // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
+ // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
+ // GNU Affero General Public License for more details.
14
+ //
15
+ // You should have received a copy of the GNU Affero General Public License
16
+ // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
/**
 * Stand-in browser adapter.
 *
 * `connect`, `getPageMeta` and `navigate` return canned values without
 * touching any browser; every other operation rejects with a
 * "not implemented" error naming the operation.
 */
export class PlaceholderBrowserAdapter {
    /**
     * Throw the shared "not implemented" error for `operation`.
     * @param {string} operation Name of the adapter method that was called.
     * @throws {Error} Always.
     */
    static #notImplemented(operation) {
        throw new Error(`Browser adapter not implemented: ${operation}`);
    }

    /**
     * Fabricate session info for `profile`.
     * @param {string} profile
     * @returns {Promise<{sessionId: string, profile: string, createdAt: string}>}
     */
    async connect(profile) {
        const sessionId = `session_${profile}_${Date.now()}`;
        const createdAt = new Date().toISOString();
        return { sessionId, profile, createdAt };
    }

    /** @returns {Promise<{url: string, title: string}>} Fixed blank-page metadata. */
    async getPageMeta(_sessionId) {
        const meta = { url: "about:blank", title: "Placeholder Session" };
        return meta;
    }

    /** @returns {Promise<{url: string, title: string}>} The requested URL with a fixed title. */
    async navigate(_sessionId, url, _timeoutMs) {
        const meta = { url, title: "Placeholder Navigation" };
        return meta;
    }

    /** Not implemented — always rejects. */
    async locate(_sessionId, _target, _timeoutMs) {
        return PlaceholderBrowserAdapter.#notImplemented("locate");
    }

    /** Not implemented — always rejects. */
    async click(_sessionId, _element) {
        return PlaceholderBrowserAdapter.#notImplemented("click");
    }

    /** Not implemented — always rejects. */
    async setValue(_sessionId, _element, _text, _clear) {
        return PlaceholderBrowserAdapter.#notImplemented("setValue");
    }

    /** Not implemented — always rejects. */
    async getValue(_sessionId, _element) {
        return PlaceholderBrowserAdapter.#notImplemented("getValue");
    }

    /** Not implemented — always rejects. */
    async waitFor(_sessionId, _condition, _timeoutMs) {
        return PlaceholderBrowserAdapter.#notImplemented("waitFor");
    }

    /** Not implemented — always rejects. */
    async extract(_sessionId, _target, _format) {
        return PlaceholderBrowserAdapter.#notImplemented("extract");
    }

    /** Not implemented — always rejects. */
    async screenshot(_sessionId, _region) {
        return PlaceholderBrowserAdapter.#notImplemented("screenshot");
    }
}