screenhand 0.1.1 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (241) hide show
  1. package/README.md +193 -109
  2. package/bin/darwin-arm64/macos-bridge +0 -0
  3. package/dist/mcp-desktop.js +5876 -0
  4. package/dist/scripts/codex-monitor-daemon.js +335 -0
  5. package/dist/scripts/export-help-center.js +112 -0
  6. package/dist/scripts/marketing-loop.js +117 -0
  7. package/dist/scripts/observer-daemon.js +288 -0
  8. package/dist/scripts/orchestrator-daemon.js +399 -0
  9. package/dist/scripts/supervisor-daemon.js +272 -0
  10. package/dist/scripts/threads-campaign.js +208 -0
  11. package/dist/scripts/worker-daemon.js +228 -0
  12. package/dist/src/agent/cli.js +82 -0
  13. package/dist/src/agent/loop.js +274 -0
  14. package/dist/src/community/fetcher.js +109 -0
  15. package/dist/src/community/index.js +6 -0
  16. package/dist/src/community/publisher.js +191 -0
  17. package/dist/src/community/remote-api.js +121 -0
  18. package/dist/src/community/types.js +3 -0
  19. package/dist/src/community/validator.js +95 -0
  20. package/{src/config.ts → dist/src/config.js} +5 -10
  21. package/dist/src/context-tracker.js +489 -0
  22. package/{src/index.ts → dist/src/index.js} +32 -52
  23. package/dist/src/ingestion/coverage-auditor.js +233 -0
  24. package/dist/src/ingestion/doc-parser.js +164 -0
  25. package/dist/src/ingestion/index.js +8 -0
  26. package/dist/src/ingestion/menu-scanner.js +152 -0
  27. package/dist/src/ingestion/reference-merger.js +186 -0
  28. package/dist/src/ingestion/shortcut-extractor.js +180 -0
  29. package/dist/src/ingestion/tutorial-extractor.js +170 -0
  30. package/dist/src/ingestion/types.js +3 -0
  31. package/dist/src/jobs/manager.js +305 -0
  32. package/dist/src/jobs/runner.js +806 -0
  33. package/dist/src/jobs/store.js +102 -0
  34. package/dist/src/jobs/types.js +30 -0
  35. package/dist/src/jobs/worker.js +97 -0
  36. package/dist/src/learning/engine.js +356 -0
  37. package/dist/src/learning/index.js +9 -0
  38. package/dist/src/learning/locator-policy.js +120 -0
  39. package/dist/src/learning/pattern-policy.js +89 -0
  40. package/dist/src/learning/recovery-policy.js +116 -0
  41. package/dist/src/learning/sensor-policy.js +115 -0
  42. package/dist/src/learning/timing-model.js +204 -0
  43. package/dist/src/learning/topology-policy.js +90 -0
  44. package/dist/src/learning/types.js +9 -0
  45. package/dist/src/logging/timeline-logger.js +48 -0
  46. package/dist/src/mcp/mcp-stdio-server.js +464 -0
  47. package/dist/src/mcp/server.js +363 -0
  48. package/dist/src/mcp-entry.js +60 -0
  49. package/dist/src/memory/playbook-seeds.js +200 -0
  50. package/dist/src/memory/recall.js +222 -0
  51. package/dist/src/memory/research.js +104 -0
  52. package/dist/src/memory/seeds.js +101 -0
  53. package/dist/src/memory/service.js +446 -0
  54. package/dist/src/memory/session.js +169 -0
  55. package/dist/src/memory/store.js +451 -0
  56. package/{src/runtime/locator-cache.ts → dist/src/memory/types.js} +1 -17
  57. package/dist/src/monitor/codex-monitor.js +382 -0
  58. package/dist/src/monitor/task-queue.js +97 -0
  59. package/dist/src/monitor/types.js +62 -0
  60. package/dist/src/native/bridge-client.js +412 -0
  61. package/{src/native/macos-bridge-client.ts → dist/src/native/macos-bridge-client.js} +0 -1
  62. package/dist/src/observer/state.js +199 -0
  63. package/dist/src/observer/types.js +43 -0
  64. package/dist/src/orchestrator/state.js +68 -0
  65. package/dist/src/orchestrator/types.js +22 -0
  66. package/dist/src/perception/ax-source.js +162 -0
  67. package/dist/src/perception/cdp-source.js +162 -0
  68. package/dist/src/perception/coordinator.js +771 -0
  69. package/dist/src/perception/frame-differ.js +287 -0
  70. package/dist/src/perception/index.js +22 -0
  71. package/dist/src/perception/manager.js +199 -0
  72. package/dist/src/perception/types.js +47 -0
  73. package/dist/src/perception/vision-source.js +399 -0
  74. package/dist/src/planner/deterministic.js +298 -0
  75. package/dist/src/planner/executor.js +870 -0
  76. package/dist/src/planner/goal-store.js +92 -0
  77. package/dist/src/planner/index.js +21 -0
  78. package/dist/src/planner/planner.js +520 -0
  79. package/dist/src/planner/tool-registry.js +71 -0
  80. package/dist/src/planner/types.js +22 -0
  81. package/dist/src/platform/explorer.js +213 -0
  82. package/dist/src/platform/help-center-markdown.js +527 -0
  83. package/dist/src/platform/learner.js +257 -0
  84. package/dist/src/playbook/engine.js +486 -0
  85. package/dist/src/playbook/index.js +20 -0
  86. package/dist/src/playbook/mcp-recorder.js +204 -0
  87. package/dist/src/playbook/recorder.js +536 -0
  88. package/dist/src/playbook/runner.js +408 -0
  89. package/dist/src/playbook/store.js +312 -0
  90. package/dist/src/playbook/types.js +17 -0
  91. package/dist/src/recovery/detectors.js +156 -0
  92. package/dist/src/recovery/engine.js +327 -0
  93. package/dist/src/recovery/index.js +20 -0
  94. package/dist/src/recovery/strategies.js +274 -0
  95. package/dist/src/recovery/types.js +20 -0
  96. package/dist/src/runtime/accessibility-adapter.js +430 -0
  97. package/dist/src/runtime/app-adapter.js +64 -0
  98. package/dist/src/runtime/applescript-adapter.js +305 -0
  99. package/dist/src/runtime/ax-role-map.js +96 -0
  100. package/dist/src/runtime/browser-adapter.js +52 -0
  101. package/dist/src/runtime/cdp-chrome-adapter.js +521 -0
  102. package/dist/src/runtime/composite-adapter.js +221 -0
  103. package/dist/src/runtime/execution-contract.js +159 -0
  104. package/dist/src/runtime/executor.js +286 -0
  105. package/dist/src/runtime/locator-cache.js +50 -0
  106. package/dist/src/runtime/planning-loop.js +63 -0
  107. package/dist/src/runtime/service.js +432 -0
  108. package/dist/src/runtime/session-manager.js +63 -0
  109. package/dist/src/runtime/state-observer.js +121 -0
  110. package/dist/src/runtime/vision-adapter.js +225 -0
  111. package/dist/src/state/app-map-types.js +72 -0
  112. package/dist/src/state/app-map.js +1974 -0
  113. package/dist/src/state/entity-tracker.js +108 -0
  114. package/dist/src/state/fusion.js +96 -0
  115. package/dist/src/state/index.js +21 -0
  116. package/dist/src/state/ladder-generator.js +236 -0
  117. package/dist/src/state/persistence.js +156 -0
  118. package/dist/src/state/types.js +17 -0
  119. package/dist/src/state/world-model.js +1456 -0
  120. package/dist/src/supervisor/locks.js +186 -0
  121. package/dist/src/supervisor/supervisor.js +403 -0
  122. package/dist/src/supervisor/types.js +30 -0
  123. package/dist/src/test-mcp-protocol.js +154 -0
  124. package/dist/src/types.js +17 -0
  125. package/dist/src/util/atomic-write.js +133 -0
  126. package/dist/src/util/sanitize.js +146 -0
  127. package/dist-app-maps/com.figma.Desktop.json +959 -0
  128. package/dist-app-maps/com.hnc.Discord.json +1146 -0
  129. package/dist-app-maps/notion.id.json +2831 -0
  130. package/dist-playbooks/canva-screenhand-carousel.json +445 -0
  131. package/dist-playbooks/codex-desktop.json +76 -0
  132. package/dist-playbooks/competitor-research-stack.json +122 -0
  133. package/dist-playbooks/davinci-color-grade.json +153 -0
  134. package/dist-playbooks/davinci-edit-timeline.json +162 -0
  135. package/dist-playbooks/davinci-render.json +114 -0
  136. package/dist-playbooks/devto.json +52 -0
  137. package/dist-playbooks/discord.json +41 -0
  138. package/dist-playbooks/google-flow-create-project.json +59 -0
  139. package/dist-playbooks/google-flow-edit-image.json +90 -0
  140. package/dist-playbooks/google-flow-edit-video.json +90 -0
  141. package/dist-playbooks/google-flow-generate-image.json +68 -0
  142. package/dist-playbooks/google-flow-generate-video.json +191 -0
  143. package/dist-playbooks/google-flow-open-project.json +48 -0
  144. package/dist-playbooks/google-flow-open-scenebuilder.json +64 -0
  145. package/dist-playbooks/google-flow-search-assets.json +64 -0
  146. package/dist-playbooks/instagram.json +57 -0
  147. package/dist-playbooks/linkedin.json +52 -0
  148. package/dist-playbooks/n8n.json +43 -0
  149. package/dist-playbooks/reddit.json +52 -0
  150. package/dist-playbooks/threads.json +59 -0
  151. package/dist-playbooks/x-twitter.json +59 -0
  152. package/dist-playbooks/youtube.json +59 -0
  153. package/dist-references/canva.json +646 -0
  154. package/dist-references/codex-desktop.json +305 -0
  155. package/dist-references/davinci-resolve-keyboard.json +594 -0
  156. package/dist-references/davinci-resolve-menu-map.json +1139 -0
  157. package/dist-references/davinci-resolve-menus-batch1.json +116 -0
  158. package/dist-references/davinci-resolve-menus-batch2.json +372 -0
  159. package/dist-references/davinci-resolve-menus-batch3.json +330 -0
  160. package/dist-references/davinci-resolve-menus-batch4.json +297 -0
  161. package/dist-references/davinci-resolve-shortcuts.json +333 -0
  162. package/dist-references/devto.json +317 -0
  163. package/dist-references/discord.json +549 -0
  164. package/dist-references/figma.json +1186 -0
  165. package/dist-references/finder.json +146 -0
  166. package/dist-references/google-ads-transparency.json +95 -0
  167. package/dist-references/google-flow.json +649 -0
  168. package/dist-references/instagram.json +341 -0
  169. package/dist-references/linkedin.json +324 -0
  170. package/dist-references/meta-ad-library.json +86 -0
  171. package/dist-references/n8n.json +387 -0
  172. package/dist-references/notes.json +27 -0
  173. package/dist-references/notion.json +163 -0
  174. package/dist-references/reddit.json +341 -0
  175. package/dist-references/threads.json +337 -0
  176. package/dist-references/x-twitter.json +403 -0
  177. package/dist-references/youtube.json +373 -0
  178. package/native/macos-bridge/Package.swift +1 -0
  179. package/native/macos-bridge/Sources/AccessibilityBridge.swift +257 -36
  180. package/native/macos-bridge/Sources/AppManagement.swift +212 -2
  181. package/native/macos-bridge/Sources/CoreGraphicsBridge.swift +348 -53
  182. package/native/macos-bridge/Sources/StreamCapture.swift +136 -0
  183. package/native/macos-bridge/Sources/VisionBridge.swift +165 -7
  184. package/native/macos-bridge/Sources/main.swift +169 -16
  185. package/native/windows-bridge/Program.cs +5 -0
  186. package/native/windows-bridge/ScreenCapture.cs +124 -0
  187. package/package.json +29 -4
  188. package/scripts/postinstall.cjs +127 -0
  189. package/.claude/commands/automate.md +0 -28
  190. package/.claude/commands/debug-ui.md +0 -19
  191. package/.claude/commands/screenshot.md +0 -15
  192. package/.github/FUNDING.yml +0 -1
  193. package/.github/ISSUE_TEMPLATE/bug_report.md +0 -27
  194. package/.github/ISSUE_TEMPLATE/feature_request.md +0 -20
  195. package/.mcp.json +0 -8
  196. package/DESKTOP_MCP_GUIDE.md +0 -92
  197. package/SECURITY.md +0 -44
  198. package/docs/architecture.md +0 -47
  199. package/install-skills.sh +0 -19
  200. package/mcp-bridge.ts +0 -271
  201. package/mcp-desktop.ts +0 -1221
  202. package/playbooks/instagram.json +0 -41
  203. package/playbooks/instagram_v2.json +0 -201
  204. package/playbooks/x_v1.json +0 -211
  205. package/scripts/devpost-live-loop.mjs +0 -421
  206. package/src/logging/timeline-logger.ts +0 -55
  207. package/src/mcp/server.ts +0 -449
  208. package/src/memory/recall.ts +0 -191
  209. package/src/memory/research.ts +0 -146
  210. package/src/memory/seeds.ts +0 -123
  211. package/src/memory/session.ts +0 -201
  212. package/src/memory/store.ts +0 -434
  213. package/src/memory/types.ts +0 -69
  214. package/src/native/bridge-client.ts +0 -239
  215. package/src/runtime/accessibility-adapter.ts +0 -487
  216. package/src/runtime/app-adapter.ts +0 -169
  217. package/src/runtime/applescript-adapter.ts +0 -376
  218. package/src/runtime/ax-role-map.ts +0 -102
  219. package/src/runtime/browser-adapter.ts +0 -129
  220. package/src/runtime/cdp-chrome-adapter.ts +0 -676
  221. package/src/runtime/composite-adapter.ts +0 -274
  222. package/src/runtime/executor.ts +0 -396
  223. package/src/runtime/planning-loop.ts +0 -81
  224. package/src/runtime/service.ts +0 -448
  225. package/src/runtime/session-manager.ts +0 -50
  226. package/src/runtime/state-observer.ts +0 -136
  227. package/src/runtime/vision-adapter.ts +0 -297
  228. package/src/types.ts +0 -297
  229. package/tests/bridge-client.test.ts +0 -176
  230. package/tests/browser-stealth.test.ts +0 -210
  231. package/tests/composite-adapter.test.ts +0 -64
  232. package/tests/mcp-server.test.ts +0 -151
  233. package/tests/memory-recall.test.ts +0 -339
  234. package/tests/memory-research.test.ts +0 -159
  235. package/tests/memory-seeds.test.ts +0 -120
  236. package/tests/memory-store.test.ts +0 -392
  237. package/tests/types.test.ts +0 -92
  238. package/tsconfig.check.json +0 -17
  239. package/tsconfig.json +0 -19
  240. package/vitest.config.ts +0 -8
  241. /package/{playbooks → dist-references}/devpost.json +0 -0
@@ -0,0 +1,204 @@
1
+ // Copyright (C) 2025 Clazro Technology Private Limited
2
+ // SPDX-License-Identifier: AGPL-3.0-only
3
+ /**
4
+ * McpPlaybookRecorder — captures MCP tool calls as PlaybookSteps.
5
+ *
6
+ * Start recording → agent does the flow → stop → saves as executable playbook.
7
+ * Like a macro recorder, but for AI tool calls.
8
+ */
9
+ import fs from "node:fs";
10
+ import path from "node:path";
11
+ import { writeFileAtomicSync } from "../util/atomic-write.js";
12
+ import { redactPII } from "../util/sanitize.js";
13
/**
 * Names of MCP tools whose calls are never turned into playbook steps.
 *
 * The recorder checks membership in this set before attempting to build a
 * step, so anything listed here is ignored while recording. Entries are
 * grouped by tool family purely for readability.
 */
const SKIP_TOOLS = new Set([
    // Screen capture
    "screenshot",
    "screenshot_file",
    // UI / browser inspection
    "ui_tree",
    "ui_find",
    "browser_dom",
    "browser_page_info",
    "browser_tabs",
    "ocr",
    "apps",
    "windows",
    // memory_*
    "memory_recall",
    "memory_save",
    "memory_snapshot",
    "memory_stats",
    "memory_errors",
    "memory_query_patterns",
    "memory_record_error",
    "memory_record_learning",
    "memory_clear",
    // Platform guide / playbook tooling
    "platform_guide",
    "playbook_preflight",
    "export_playbook",
    "playbook_record",
    // job_*
    "job_create",
    "job_status",
    "job_list",
    "job_run",
    "job_run_all",
    "job_create_chain",
    "job_remove",
    "job_transition",
    "job_step_done",
    "job_step_fail",
    "job_resume",
    "job_dequeue",
    // worker_*
    "worker_start",
    "worker_stop",
    "worker_status",
    // supervisor_*
    "supervisor_status",
    "supervisor_start",
    "supervisor_stop",
    "supervisor_pause",
    "supervisor_resume",
    "supervisor_install",
    "supervisor_uninstall",
    // session_*
    "session_claim",
    "session_heartbeat",
    "session_release",
    // recovery_queue_*
    "recovery_queue_add",
    "recovery_queue_list",
    // codex_monitor_*
    "codex_monitor_start",
    "codex_monitor_status",
    "codex_monitor_add_task",
    "codex_monitor_tasks",
    "codex_monitor_assign_now",
    "codex_monitor_stop",
    // Platform learning / exploration
    "platform_learn",
    "platform_explore",
]);
32
/**
 * Lookup table: MCP tool name -> PlaybookStep action.
 *
 * Tools that are deliberately not recorded as steps ("focus", "launch",
 * "drag") are simply absent, so they resolve to null like any unknown tool.
 */
const TOOL_ACTIONS = new Map([
    ["browser_navigate", "navigate"],
    ["click", "press"],
    ["click_text", "press"],
    ["browser_click", "press"],
    ["click_with_fallback", "press"],
    ["ui_press", "press"],
    ["type_text", "type_into"],
    ["browser_type", "type_into"],
    ["type_with_fallback", "type_into"],
    ["key", "key"],
    ["menu_click", "menu_click"],
    ["scroll", "scroll"],
    ["scroll_with_fallback", "scroll"],
    ["browser_js", "browser_js"],
    ["screenshot", "screenshot"],
    ["screenshot_file", "screenshot"],
    ["browser_wait", "wait"],
    ["wait_for_state", "wait"],
]);
/**
 * Map an MCP tool name to the PlaybookStep action it should be recorded as.
 *
 * @param {string} toolName - Name of the MCP tool that was called.
 * @returns {string|null} The step action, or null when the tool has no
 *   step equivalent.
 */
function mapToolToAction(toolName) {
    return TOOL_ACTIONS.get(toolName) ?? null;
}
59
/**
 * Build a PlaybookStep from an MCP tool call.
 *
 * The tool name is translated to a step action via mapToolToAction(); the
 * action then decides which tool parameters are copied onto the step and how
 * the human-readable description is worded.
 *
 * @param {string} toolName - Name of the MCP tool that was called.
 * @param {object} [params] - Arguments the tool was called with. A missing
 *   object is treated as "no arguments".
 * @param {boolean} success - Whether the tool call succeeded. Failed calls
 *   are still recorded, but flagged `optional`.
 * @returns {object|null} The step, or null when the tool has no step
 *   equivalent.
 */
function buildStep(toolName, params, success) {
    const action = mapToolToAction(toolName);
    if (!action)
        return null;
    // Guard against calls recorded without an arguments object; every branch
    // below reads properties off it.
    const args = params ?? {};
    const step = { action };
    switch (action) {
        case "navigate":
            step.url = String(args.url ?? "");
            step.description = `Navigate to ${step.url}`;
            break;
        case "press":
            // Different click tools name their target differently; take the
            // first one present.
            step.target = String(args.selector ?? args.text ?? args.title ?? args.target ?? "");
            step.description = `Click ${step.target}`;
            break;
        case "type_into":
            step.target = String(args.selector ?? args.target ?? args.field ?? "");
            step.text = String(args.text ?? args.value ?? "");
            step.description = `Type "${step.text.substring(0, 50)}" into ${step.target}`;
            break;
        case "key":
        case "key_combo": {
            const combo = String(args.combo ?? args.key ?? "");
            step.keys = combo.split("+").map(k => k.trim());
            step.description = `${action === "key" ? "Key" : "Key combo"}: ${combo}`;
            break;
        }
        case "menu_click": {
            // menuPath may arrive as an array of segments or as a single
            // "/"-separated string; normalise both to a clean array.
            const menuPath = Array.isArray(args.menuPath)
                ? args.menuPath.map((part) => String(part).trim()).filter(Boolean)
                : String(args.menuPath ?? "").split("/").map((part) => part.trim()).filter(Boolean);
            step.menuPath = menuPath;
            step.description = `Menu click: ${menuPath.join(" > ")}`;
            break;
        }
        case "scroll":
            step.direction = args.direction ?? "down";
            if (args.amount != null) {
                // A non-numeric amount would become NaN, which serialises to
                // null in the saved playbook; omit it instead.
                const amount = Number(args.amount);
                if (Number.isFinite(amount))
                    step.amount = amount;
            }
            step.description = `Scroll ${step.direction}`;
            break;
        case "browser_js":
            step.code = String(args.code ?? "");
            step.description = `Execute JS: ${step.code.substring(0, 60)}...`;
            break;
        case "screenshot":
            step.description = "Take screenshot";
            break;
        case "wait": {
            // Fall back to the 1000ms default when the supplied value is not
            // a usable number, rather than recording NaN.
            const ms = Number(args.timeout ?? args.ms ?? args.timeoutMs ?? 1000);
            step.ms = Number.isFinite(ms) ? ms : 1000;
            step.description = `Wait ${step.ms}ms`;
            break;
        }
    }
    if (!success) {
        step.optional = true;
    }
    return step;
}
117
/** Scalar step fields that distinguish one recorded step from another. */
const STEP_IDENTITY_FIELDS = ["action", "target", "text", "code", "url", "direction", "amount", "ms"];
/** List-valued step fields, compared by their serialised contents. */
const STEP_IDENTITY_LISTS = ["keys", "menuPath"];
/**
 * Decide whether two recorded steps carry the same payload.
 * `description` and `optional` are intentionally ignored.
 */
function isSameRecordedStep(a, b) {
    return STEP_IDENTITY_FIELDS.every((field) => Object.is(a[field], b[field])) &&
        STEP_IDENTITY_LISTS.every((field) => JSON.stringify(a[field] ?? []) === JSON.stringify(b[field] ?? []));
}
/**
 * Records MCP tool calls as playbook steps and saves them as a JSON playbook.
 *
 * Lifecycle: start() begins a session, captureToolCall() is fed every tool
 * call while the session is active, and stop() writes the collected steps to
 * `<playbooksDir>/<id>.json` (or cancel() discards them).
 */
export class McpPlaybookRecorder {
    playbooksDir;
    recording = false;
    platform = "";
    steps = [];
    startTime = "";
    cdpPort;
    /**
     * @param {string} playbooksDir - Directory recorded playbooks are saved to.
     */
    constructor(playbooksDir) {
        this.playbooksDir = playbooksDir;
    }
    /** True while a recording session is active. */
    get isRecording() { return this.recording; }
    /** Number of steps captured so far in the current session. */
    get stepCount() { return this.steps.length; }
    /** Shallow copy of the steps captured so far. */
    getSteps() { return [...this.steps]; }
    /**
     * Begin a new recording session, discarding any previously captured steps.
     *
     * @param {string} platform - Platform name; stored on the playbook and used
     *   (sanitised) as the prefix of its id.
     * @param {number} [cdpPort] - Optional CDP port to store on the playbook.
     */
    start(platform, cdpPort) {
        this.recording = true;
        this.platform = platform;
        this.steps = [];
        this.startTime = new Date().toISOString();
        // Always overwrite: a session started without a port must not inherit
        // the port of an earlier session.
        this.cdpPort = cdpPort;
    }
    /**
     * Capture one tool call as a step, if it maps to a recordable action.
     *
     * Ignored when no session is active, when the tool is in SKIP_TOOLS, when
     * buildStep() yields no step, or when the step repeats the previous one.
     *
     * @param {string} toolName - Name of the MCP tool that was called.
     * @param {object} params - Arguments the tool was called with.
     * @param {boolean} success - Whether the call succeeded.
     * @param {*} [_result] - Unused.
     * @param {number} [_durationMs] - Unused.
     */
    captureToolCall(toolName, params, success, _result, _durationMs) {
        if (!this.recording)
            return;
        if (SKIP_TOOLS.has(toolName))
            return;
        const step = buildStep(toolName, params, success);
        if (!step)
            return;
        // Deduplicate consecutive identical steps. Every payload field takes
        // part in the comparison so that, e.g., two navigations to different
        // URLs or scrolls in different directions are both kept.
        const last = this.steps[this.steps.length - 1];
        if (last && isSameRecordedStep(last, step)) {
            return; // skip duplicate
        }
        this.steps.push(step);
    }
    /**
     * End the session and save the captured steps as a playbook file.
     *
     * Text-bearing step fields, the name and the description are passed
     * through redactPII() before being written.
     *
     * @param {string} name - Playbook name.
     * @param {string} description - Playbook description.
     * @returns {object} The playbook object that was written.
     * @throws {Error} If the target file would fall outside playbooksDir.
     */
    stop(name, description) {
        this.recording = false;
        // Sanitize platform to prevent path traversal in filename
        const safePlatform = this.platform.replace(/[^a-zA-Z0-9_\-]/g, "_").slice(0, 100);
        const id = safePlatform + "-" + Date.now().toString(36);
        // S75 Option C: Redact PII in persisted playbook steps and metadata
        const redactedSteps = this.steps.map(s => ({
            ...s,
            ...(s.text ? { text: redactPII(s.text) } : {}),
            ...(typeof s.target === "string" ? { target: redactPII(s.target) } : {}),
            ...(s.url ? { url: redactPII(s.url) } : {}),
            ...(s.code ? { code: redactPII(s.code) } : {}),
            ...(s.description ? { description: redactPII(s.description) } : {}),
        }));
        const playbook = {
            id,
            name: redactPII(name),
            description: redactPII(description),
            platform: this.platform,
            version: "1.0.0",
            tags: [this.platform, "recorded"],
            successCount: 0,
            failCount: 0,
            steps: redactedSteps,
        };
        if (this.cdpPort) {
            playbook.cdpPort = this.cdpPort;
        }
        // Save to playbooks dir. mkdirSync with `recursive` is a no-op when the
        // directory already exists, so no separate existence check is needed.
        fs.mkdirSync(this.playbooksDir, { recursive: true });
        const root = path.resolve(this.playbooksDir);
        const resolved = path.resolve(root, `${id}.json`);
        // Containment check via the relative path: a plain string-prefix test
        // would also accept sibling directories such as "<root>-other".
        const relative = path.relative(root, resolved);
        const escapesRoot = relative === "" ||
            relative === ".." ||
            relative.startsWith(".." + path.sep) ||
            path.isAbsolute(relative);
        if (escapesRoot) {
            throw new Error("Invalid playbook path — refusing to write outside playbooks directory");
        }
        writeFileAtomicSync(resolved, JSON.stringify(playbook, null, 2));
        this.steps = [];
        return playbook;
    }
    /** Abort the session and discard everything captured so far. */
    cancel() {
        this.recording = false;
        this.steps = [];
    }
}