screenhand 0.1.1 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (241) hide show
  1. package/README.md +193 -109
  2. package/bin/darwin-arm64/macos-bridge +0 -0
  3. package/dist/mcp-desktop.js +5876 -0
  4. package/dist/scripts/codex-monitor-daemon.js +335 -0
  5. package/dist/scripts/export-help-center.js +112 -0
  6. package/dist/scripts/marketing-loop.js +117 -0
  7. package/dist/scripts/observer-daemon.js +288 -0
  8. package/dist/scripts/orchestrator-daemon.js +399 -0
  9. package/dist/scripts/supervisor-daemon.js +272 -0
  10. package/dist/scripts/threads-campaign.js +208 -0
  11. package/dist/scripts/worker-daemon.js +228 -0
  12. package/dist/src/agent/cli.js +82 -0
  13. package/dist/src/agent/loop.js +274 -0
  14. package/dist/src/community/fetcher.js +109 -0
  15. package/dist/src/community/index.js +6 -0
  16. package/dist/src/community/publisher.js +191 -0
  17. package/dist/src/community/remote-api.js +121 -0
  18. package/dist/src/community/types.js +3 -0
  19. package/dist/src/community/validator.js +95 -0
  20. package/{src/config.ts → dist/src/config.js} +5 -10
  21. package/dist/src/context-tracker.js +489 -0
  22. package/{src/index.ts → dist/src/index.js} +32 -52
  23. package/dist/src/ingestion/coverage-auditor.js +233 -0
  24. package/dist/src/ingestion/doc-parser.js +164 -0
  25. package/dist/src/ingestion/index.js +8 -0
  26. package/dist/src/ingestion/menu-scanner.js +152 -0
  27. package/dist/src/ingestion/reference-merger.js +186 -0
  28. package/dist/src/ingestion/shortcut-extractor.js +180 -0
  29. package/dist/src/ingestion/tutorial-extractor.js +170 -0
  30. package/dist/src/ingestion/types.js +3 -0
  31. package/dist/src/jobs/manager.js +305 -0
  32. package/dist/src/jobs/runner.js +806 -0
  33. package/dist/src/jobs/store.js +102 -0
  34. package/dist/src/jobs/types.js +30 -0
  35. package/dist/src/jobs/worker.js +97 -0
  36. package/dist/src/learning/engine.js +356 -0
  37. package/dist/src/learning/index.js +9 -0
  38. package/dist/src/learning/locator-policy.js +120 -0
  39. package/dist/src/learning/pattern-policy.js +89 -0
  40. package/dist/src/learning/recovery-policy.js +116 -0
  41. package/dist/src/learning/sensor-policy.js +115 -0
  42. package/dist/src/learning/timing-model.js +204 -0
  43. package/dist/src/learning/topology-policy.js +90 -0
  44. package/dist/src/learning/types.js +9 -0
  45. package/dist/src/logging/timeline-logger.js +48 -0
  46. package/dist/src/mcp/mcp-stdio-server.js +464 -0
  47. package/dist/src/mcp/server.js +363 -0
  48. package/dist/src/mcp-entry.js +60 -0
  49. package/dist/src/memory/playbook-seeds.js +200 -0
  50. package/dist/src/memory/recall.js +222 -0
  51. package/dist/src/memory/research.js +104 -0
  52. package/dist/src/memory/seeds.js +101 -0
  53. package/dist/src/memory/service.js +446 -0
  54. package/dist/src/memory/session.js +169 -0
  55. package/dist/src/memory/store.js +451 -0
  56. package/{src/runtime/locator-cache.ts → dist/src/memory/types.js} +1 -17
  57. package/dist/src/monitor/codex-monitor.js +382 -0
  58. package/dist/src/monitor/task-queue.js +97 -0
  59. package/dist/src/monitor/types.js +62 -0
  60. package/dist/src/native/bridge-client.js +412 -0
  61. package/{src/native/macos-bridge-client.ts → dist/src/native/macos-bridge-client.js} +0 -1
  62. package/dist/src/observer/state.js +199 -0
  63. package/dist/src/observer/types.js +43 -0
  64. package/dist/src/orchestrator/state.js +68 -0
  65. package/dist/src/orchestrator/types.js +22 -0
  66. package/dist/src/perception/ax-source.js +162 -0
  67. package/dist/src/perception/cdp-source.js +162 -0
  68. package/dist/src/perception/coordinator.js +771 -0
  69. package/dist/src/perception/frame-differ.js +287 -0
  70. package/dist/src/perception/index.js +22 -0
  71. package/dist/src/perception/manager.js +199 -0
  72. package/dist/src/perception/types.js +47 -0
  73. package/dist/src/perception/vision-source.js +399 -0
  74. package/dist/src/planner/deterministic.js +298 -0
  75. package/dist/src/planner/executor.js +870 -0
  76. package/dist/src/planner/goal-store.js +92 -0
  77. package/dist/src/planner/index.js +21 -0
  78. package/dist/src/planner/planner.js +520 -0
  79. package/dist/src/planner/tool-registry.js +71 -0
  80. package/dist/src/planner/types.js +22 -0
  81. package/dist/src/platform/explorer.js +213 -0
  82. package/dist/src/platform/help-center-markdown.js +527 -0
  83. package/dist/src/platform/learner.js +257 -0
  84. package/dist/src/playbook/engine.js +486 -0
  85. package/dist/src/playbook/index.js +20 -0
  86. package/dist/src/playbook/mcp-recorder.js +204 -0
  87. package/dist/src/playbook/recorder.js +536 -0
  88. package/dist/src/playbook/runner.js +408 -0
  89. package/dist/src/playbook/store.js +312 -0
  90. package/dist/src/playbook/types.js +17 -0
  91. package/dist/src/recovery/detectors.js +156 -0
  92. package/dist/src/recovery/engine.js +327 -0
  93. package/dist/src/recovery/index.js +20 -0
  94. package/dist/src/recovery/strategies.js +274 -0
  95. package/dist/src/recovery/types.js +20 -0
  96. package/dist/src/runtime/accessibility-adapter.js +430 -0
  97. package/dist/src/runtime/app-adapter.js +64 -0
  98. package/dist/src/runtime/applescript-adapter.js +305 -0
  99. package/dist/src/runtime/ax-role-map.js +96 -0
  100. package/dist/src/runtime/browser-adapter.js +52 -0
  101. package/dist/src/runtime/cdp-chrome-adapter.js +521 -0
  102. package/dist/src/runtime/composite-adapter.js +221 -0
  103. package/dist/src/runtime/execution-contract.js +159 -0
  104. package/dist/src/runtime/executor.js +286 -0
  105. package/dist/src/runtime/locator-cache.js +50 -0
  106. package/dist/src/runtime/planning-loop.js +63 -0
  107. package/dist/src/runtime/service.js +432 -0
  108. package/dist/src/runtime/session-manager.js +63 -0
  109. package/dist/src/runtime/state-observer.js +121 -0
  110. package/dist/src/runtime/vision-adapter.js +225 -0
  111. package/dist/src/state/app-map-types.js +72 -0
  112. package/dist/src/state/app-map.js +1974 -0
  113. package/dist/src/state/entity-tracker.js +108 -0
  114. package/dist/src/state/fusion.js +96 -0
  115. package/dist/src/state/index.js +21 -0
  116. package/dist/src/state/ladder-generator.js +236 -0
  117. package/dist/src/state/persistence.js +156 -0
  118. package/dist/src/state/types.js +17 -0
  119. package/dist/src/state/world-model.js +1456 -0
  120. package/dist/src/supervisor/locks.js +186 -0
  121. package/dist/src/supervisor/supervisor.js +403 -0
  122. package/dist/src/supervisor/types.js +30 -0
  123. package/dist/src/test-mcp-protocol.js +154 -0
  124. package/dist/src/types.js +17 -0
  125. package/dist/src/util/atomic-write.js +133 -0
  126. package/dist/src/util/sanitize.js +146 -0
  127. package/dist-app-maps/com.figma.Desktop.json +959 -0
  128. package/dist-app-maps/com.hnc.Discord.json +1146 -0
  129. package/dist-app-maps/notion.id.json +2831 -0
  130. package/dist-playbooks/canva-screenhand-carousel.json +445 -0
  131. package/dist-playbooks/codex-desktop.json +76 -0
  132. package/dist-playbooks/competitor-research-stack.json +122 -0
  133. package/dist-playbooks/davinci-color-grade.json +153 -0
  134. package/dist-playbooks/davinci-edit-timeline.json +162 -0
  135. package/dist-playbooks/davinci-render.json +114 -0
  136. package/dist-playbooks/devto.json +52 -0
  137. package/dist-playbooks/discord.json +41 -0
  138. package/dist-playbooks/google-flow-create-project.json +59 -0
  139. package/dist-playbooks/google-flow-edit-image.json +90 -0
  140. package/dist-playbooks/google-flow-edit-video.json +90 -0
  141. package/dist-playbooks/google-flow-generate-image.json +68 -0
  142. package/dist-playbooks/google-flow-generate-video.json +191 -0
  143. package/dist-playbooks/google-flow-open-project.json +48 -0
  144. package/dist-playbooks/google-flow-open-scenebuilder.json +64 -0
  145. package/dist-playbooks/google-flow-search-assets.json +64 -0
  146. package/dist-playbooks/instagram.json +57 -0
  147. package/dist-playbooks/linkedin.json +52 -0
  148. package/dist-playbooks/n8n.json +43 -0
  149. package/dist-playbooks/reddit.json +52 -0
  150. package/dist-playbooks/threads.json +59 -0
  151. package/dist-playbooks/x-twitter.json +59 -0
  152. package/dist-playbooks/youtube.json +59 -0
  153. package/dist-references/canva.json +646 -0
  154. package/dist-references/codex-desktop.json +305 -0
  155. package/dist-references/davinci-resolve-keyboard.json +594 -0
  156. package/dist-references/davinci-resolve-menu-map.json +1139 -0
  157. package/dist-references/davinci-resolve-menus-batch1.json +116 -0
  158. package/dist-references/davinci-resolve-menus-batch2.json +372 -0
  159. package/dist-references/davinci-resolve-menus-batch3.json +330 -0
  160. package/dist-references/davinci-resolve-menus-batch4.json +297 -0
  161. package/dist-references/davinci-resolve-shortcuts.json +333 -0
  162. package/dist-references/devto.json +317 -0
  163. package/dist-references/discord.json +549 -0
  164. package/dist-references/figma.json +1186 -0
  165. package/dist-references/finder.json +146 -0
  166. package/dist-references/google-ads-transparency.json +95 -0
  167. package/dist-references/google-flow.json +649 -0
  168. package/dist-references/instagram.json +341 -0
  169. package/dist-references/linkedin.json +324 -0
  170. package/dist-references/meta-ad-library.json +86 -0
  171. package/dist-references/n8n.json +387 -0
  172. package/dist-references/notes.json +27 -0
  173. package/dist-references/notion.json +163 -0
  174. package/dist-references/reddit.json +341 -0
  175. package/dist-references/threads.json +337 -0
  176. package/dist-references/x-twitter.json +403 -0
  177. package/dist-references/youtube.json +373 -0
  178. package/native/macos-bridge/Package.swift +1 -0
  179. package/native/macos-bridge/Sources/AccessibilityBridge.swift +257 -36
  180. package/native/macos-bridge/Sources/AppManagement.swift +212 -2
  181. package/native/macos-bridge/Sources/CoreGraphicsBridge.swift +348 -53
  182. package/native/macos-bridge/Sources/StreamCapture.swift +136 -0
  183. package/native/macos-bridge/Sources/VisionBridge.swift +165 -7
  184. package/native/macos-bridge/Sources/main.swift +169 -16
  185. package/native/windows-bridge/Program.cs +5 -0
  186. package/native/windows-bridge/ScreenCapture.cs +124 -0
  187. package/package.json +29 -4
  188. package/scripts/postinstall.cjs +127 -0
  189. package/.claude/commands/automate.md +0 -28
  190. package/.claude/commands/debug-ui.md +0 -19
  191. package/.claude/commands/screenshot.md +0 -15
  192. package/.github/FUNDING.yml +0 -1
  193. package/.github/ISSUE_TEMPLATE/bug_report.md +0 -27
  194. package/.github/ISSUE_TEMPLATE/feature_request.md +0 -20
  195. package/.mcp.json +0 -8
  196. package/DESKTOP_MCP_GUIDE.md +0 -92
  197. package/SECURITY.md +0 -44
  198. package/docs/architecture.md +0 -47
  199. package/install-skills.sh +0 -19
  200. package/mcp-bridge.ts +0 -271
  201. package/mcp-desktop.ts +0 -1221
  202. package/playbooks/instagram.json +0 -41
  203. package/playbooks/instagram_v2.json +0 -201
  204. package/playbooks/x_v1.json +0 -211
  205. package/scripts/devpost-live-loop.mjs +0 -421
  206. package/src/logging/timeline-logger.ts +0 -55
  207. package/src/mcp/server.ts +0 -449
  208. package/src/memory/recall.ts +0 -191
  209. package/src/memory/research.ts +0 -146
  210. package/src/memory/seeds.ts +0 -123
  211. package/src/memory/session.ts +0 -201
  212. package/src/memory/store.ts +0 -434
  213. package/src/memory/types.ts +0 -69
  214. package/src/native/bridge-client.ts +0 -239
  215. package/src/runtime/accessibility-adapter.ts +0 -487
  216. package/src/runtime/app-adapter.ts +0 -169
  217. package/src/runtime/applescript-adapter.ts +0 -376
  218. package/src/runtime/ax-role-map.ts +0 -102
  219. package/src/runtime/browser-adapter.ts +0 -129
  220. package/src/runtime/cdp-chrome-adapter.ts +0 -676
  221. package/src/runtime/composite-adapter.ts +0 -274
  222. package/src/runtime/executor.ts +0 -396
  223. package/src/runtime/planning-loop.ts +0 -81
  224. package/src/runtime/service.ts +0 -448
  225. package/src/runtime/session-manager.ts +0 -50
  226. package/src/runtime/state-observer.ts +0 -136
  227. package/src/runtime/vision-adapter.ts +0 -297
  228. package/src/types.ts +0 -297
  229. package/tests/bridge-client.test.ts +0 -176
  230. package/tests/browser-stealth.test.ts +0 -210
  231. package/tests/composite-adapter.test.ts +0 -64
  232. package/tests/mcp-server.test.ts +0 -151
  233. package/tests/memory-recall.test.ts +0 -339
  234. package/tests/memory-research.test.ts +0 -159
  235. package/tests/memory-seeds.test.ts +0 -120
  236. package/tests/memory-store.test.ts +0 -392
  237. package/tests/types.test.ts +0 -92
  238. package/tsconfig.check.json +0 -17
  239. package/tsconfig.json +0 -19
  240. package/vitest.config.ts +0 -8
  241. /package/{playbooks → dist-references}/devpost.json +0 -0
@@ -1,146 +0,0 @@
1
- // Copyright (C) 2025 Clazro Technology Private Limited
2
- // SPDX-License-Identifier: AGPL-3.0-only
3
- //
4
- // This file is part of ScreenHand.
5
- //
6
- // ScreenHand is free software: you can redistribute it and/or modify
7
- // it under the terms of the GNU Affero General Public License as
8
- // published by the Free Software Foundation, version 3.
9
- //
10
- // ScreenHand is distributed in the hope that it will be useful,
11
- // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
- // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
- // GNU Affero General Public License for more details.
14
- //
15
- // You should have received a copy of the GNU Affero General Public License
16
- // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
-
18
- /**
19
- * Background web research — fire-and-forget resolution lookup.
20
- *
21
- * When a tool fails and no resolution exists, this searches for a fix
22
- * in the background (non-blocking) and saves it for next time.
23
- *
24
- * Resolution paths:
25
- * 1. Claude API (haiku) — if ANTHROPIC_API_KEY is set
26
- * 2. DuckDuckGo instant answer — free fallback, no auth
27
- */
28
-
29
- import type { MemoryStore } from "./store.js";
30
-
31
/**
 * Kick off a resolution lookup for a failed tool call without waiting on it.
 *
 * The lookup runs detached: its promise is discarded and any rejection is
 * swallowed, so this function returns immediately and the lookup can never
 * surface an error to the caller.
 *
 * @param store - Memory store handed to the lookup for persisting results.
 * @param tool - Name of the tool that failed.
 * @param params - Parameters the tool was invoked with.
 * @param errorMessage - Error text reported by the failing tool.
 */
export function backgroundResearch(
  store: MemoryStore,
  tool: string,
  params: Record<string, unknown>,
  errorMessage: string,
): void {
  const lookup = doResearch(store, tool, params, errorMessage);
  // Best-effort by design: a failed lookup must stay invisible to the caller.
  void lookup.catch(() => undefined);
}
40
-
41
/**
 * Look up a fix for a failed tool call and persist whatever is found.
 *
 * The Claude API is consulted first, but only when `ANTHROPIC_API_KEY` is set
 * in the environment; DuckDuckGo is used when that yields nothing. If neither
 * source produces a resolution, nothing is written.
 *
 * On success two records are appended to the store: an error entry carrying
 * the resolution text, and a single-step strategy that records the tool call.
 *
 * @param store - Destination for the error entry and the strategy.
 * @param tool - Name of the tool that failed.
 * @param params - Parameters the tool was invoked with.
 * @param errorMessage - Error text reported by the failing tool.
 */
async function doResearch(
  store: MemoryStore,
  tool: string,
  params: Record<string, unknown>,
  errorMessage: string,
): Promise<void> {
  // Only the first 200 characters of the error go into the search query.
  const query = `macOS automation: "${tool}" failed with "${errorMessage.slice(0, 200)}"`;

  const anthropicKey = process.env["ANTHROPIC_API_KEY"];
  const fromClaude = anthropicKey ? await tryClaudeAPI(anthropicKey, query) : null;
  const resolution = fromClaude || (await tryDuckDuckGo(query));
  if (!resolution) {
    return;
  }

  // Error-cache entry: pairs the original failure with the fix that was found.
  const errorRecord = {
    id: "err_research_" + Date.now().toString(36),
    tool,
    params,
    error: errorMessage,
    resolution,
    occurrences: 1,
    lastSeen: new Date().toISOString(),
  };
  store.appendError(errorRecord);

  // Reusable strategy entry; the task label keeps only 100 characters of the error.
  const strategyRecord = {
    id: "str_research_" + Date.now().toString(36),
    task: `Fix: ${tool} — ${errorMessage.slice(0, 100)}`,
    steps: [{ tool, params }],
    totalDurationMs: 0,
    successCount: 1,
    failCount: 0,
    lastUsed: new Date().toISOString(),
    tags: [tool, "research", "fix"],
    fingerprint: "",
  };
  store.appendStrategy(strategyRecord);
}
86
-
87
/**
 * Ask the Anthropic Messages API for a short fix suggestion.
 *
 * The whole exchange — connecting, receiving headers and reading the JSON
 * body — is bounded by a single 10 second abort timer, and the timer is
 * always cleared on the way out so it cannot keep the event loop alive after
 * an early failure.
 *
 * @param apiKey - Value sent in the `x-api-key` header.
 * @param query - Error description embedded in the prompt.
 * @returns The trimmed text of the first text block in the reply when it is
 *   longer than 10 characters; `null` on any network error, non-2xx status,
 *   timeout, malformed payload or too-short answer. Never throws.
 */
async function tryClaudeAPI(apiKey: string, query: string): Promise<string | null> {
  const timeoutMs = 10000;
  let timer: ReturnType<typeof setTimeout> | undefined;

  try {
    const controller = new AbortController();
    timer = setTimeout(() => controller.abort(), timeoutMs);

    const response = await fetch("https://api.anthropic.com/v1/messages", {
      method: "POST",
      headers: {
        "Content-Type": "application/json",
        "x-api-key": apiKey,
        "anthropic-version": "2023-06-01",
      },
      body: JSON.stringify({
        model: "claude-haiku-4-5-20251001",
        max_tokens: 200,
        messages: [{
          role: "user",
          content: `You are a macOS automation expert. Give a brief fix (1-2 sentences) for this error:\n\n${query}`,
        }],
      }),
      signal: controller.signal,
    });

    if (!response.ok) return null;

    // The abort signal is still armed here, so a stalled body read times out too.
    const data = await response.json() as {
      content?: Array<{ type: string; text?: string }>;
    };

    // Use the first block that actually carries text instead of assuming index 0.
    const textBlock = data.content?.find(
      (block) => block.type === "text" && typeof block.text === "string",
    );
    // Trim before measuring so whitespace padding cannot satisfy the length floor.
    const text = textBlock?.text?.trim();
    return text !== undefined && text.length > 10 ? text : null;
  } catch {
    // Best-effort lookup: network failures, aborts and bad JSON all mean "no answer".
    return null;
  } finally {
    clearTimeout(timer);
  }
}
123
-
124
/**
 * Query the DuckDuckGo instant-answer endpoint for a fix suggestion.
 *
 * The whole exchange, including reading the JSON body, is bounded by a single
 * 5 second abort timer that is always cleared on the way out.
 *
 * @param query - Search text; it is URL-encoded before being sent.
 * @returns The first of `AbstractText`, `Abstract`, `Answer` that is a
 *   non-blank string, trimmed, when it is longer than 10 characters; `null`
 *   on any network error, non-2xx status, timeout, malformed payload or
 *   too-short answer. Never throws.
 */
async function tryDuckDuckGo(query: string): Promise<string | null> {
  const timeoutMs = 5000;
  let timer: ReturnType<typeof setTimeout> | undefined;

  try {
    const controller = new AbortController();
    timer = setTimeout(() => controller.abort(), timeoutMs);

    const url = `https://api.duckduckgo.com/?q=${encodeURIComponent(query)}&format=json&no_html=1`;
    const response = await fetch(url, { signal: controller.signal });

    if (!response.ok) return null;

    // The abort signal is still armed here, so a stalled body read times out too.
    const data = await response.json() as {
      AbstractText?: string;
      Abstract?: string;
      Answer?: string;
    };

    // Same field priority as before, but a whitespace-only field no longer
    // shadows a usable one further down the list.
    for (const candidate of [data.AbstractText, data.Abstract, data.Answer]) {
      if (typeof candidate !== "string") continue;
      const text = candidate.trim();
      if (text.length === 0) continue;
      return text.length > 10 ? text : null;
    }
    return null;
  } catch {
    // Best-effort lookup: network failures, aborts and bad JSON all mean "no answer".
    return null;
  } finally {
    clearTimeout(timer);
  }
}
@@ -1,123 +0,0 @@
1
- // Copyright (C) 2025 Clazro Technology Private Limited
2
- // SPDX-License-Identifier: AGPL-3.0-only
3
- //
4
- // This file is part of ScreenHand.
5
- //
6
- // ScreenHand is free software: you can redistribute it and/or modify
7
- // it under the terms of the GNU Affero General Public License as
8
- // published by the Free Software Foundation, version 3.
9
- //
10
- // ScreenHand is distributed in the hope that it will be useful,
11
- // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
- // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
- // GNU Affero General Public License for more details.
14
- //
15
- // You should have received a copy of the GNU Affero General Public License
16
- // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
-
18
- /**
19
- * Predefined seed strategies — common macOS desktop workflows.
20
- * Loaded on first boot so the memory system has knowledge from day one.
21
- */
22
-
23
- import type { Strategy, StrategyStep } from "./types.js";
24
-
25
/** Number of seeds built so far; supplies the sequential part of each seed id. */
let seedCounter = 0;

/**
 * Build a fingerprint string for an ordered list of tool names.
 *
 * @param tools - Tool names in execution order.
 * @returns The names joined with "→"; an empty list gives an empty string.
 */
function makeFingerprint(tools: string[]): string {
  return tools.join("→");
}

/**
 * Create one predefined strategy record.
 *
 * Ids are assigned in call order as `seed_001`, `seed_002`, … using the
 * module-level counter. Every seed starts with 10 recorded successes, no
 * failures, a zero duration and the current time as `lastUsed`.
 *
 * @param task - Human-readable description of the workflow.
 * @param steps - Ordered tool invocations that make up the workflow.
 * @param tags - Keywords stored on the strategy.
 * @returns The assembled strategy.
 */
function seed(task: string, steps: StrategyStep[], tags: string[]): Strategy {
  seedCounter += 1;
  const ordinal = seedCounter.toString().padStart(3, "0");

  const toolNames: string[] = [];
  for (const step of steps) {
    toolNames.push(step.tool);
  }

  const strategy: Strategy = {
    id: "seed_" + ordinal,
    task,
    steps,
    totalDurationMs: 0,
    successCount: 10,
    failCount: 0,
    lastUsed: new Date().toISOString(),
    tags,
    fingerprint: makeFingerprint(toolNames),
  };
  return strategy;
}
45
-
46
/** Step that launches the application with the given bundle id. */
const launchApp = (bundleId: string): StrategyStep => ({ tool: "launch", params: { bundleId } });

/** Step that focuses the application with the given bundle id. */
const focusApp = (bundleId: string): StrategyStep => ({ tool: "focus", params: { bundleId } });

/** Step that sends a keyboard combo such as "cmd+s". */
const pressKeys = (combo: string): StrategyStep => ({ tool: "key", params: { combo } });

/** Step that points the browser at a URL. */
const navigateTo = (url: string): StrategyStep => ({ tool: "browser_navigate", params: { url } });

/** Step that types literal text. */
const typeText = (text: string): StrategyStep => ({ tool: "type_text", params: { text } });

/**
 * Built-in strategies for common macOS desktop workflows.
 *
 * Entries are created in list order, so their ids run from `seed_001` upward
 * in the order shown here. Empty-string and zero parameter values look like
 * placeholders for values supplied at use time — NOTE(review): confirm
 * against whatever consumes these strategies.
 */
export const SEED_STRATEGIES: Strategy[] = [
  // Photo Booth: take a photo
  seed(
    "Take a photo with Photo Booth",
    [
      launchApp("com.apple.PhotoBooth"),
      { tool: "ui_press", params: { title: "Take Photo" } },
    ],
    ["photo", "booth", "camera"],
  ),

  // Chrome: open a URL
  seed(
    "Open a URL in Chrome",
    [launchApp("com.google.Chrome"), navigateTo("")],
    ["chrome", "browse", "url"],
  ),

  // Any app: save the current document
  seed(
    "Save current document",
    [focusApp(""), pressKeys("cmd+s")],
    ["save", "document"],
  ),

  // Two apps: copy from the first, paste into the second
  seed(
    "Copy from one app and paste into another",
    [focusApp(""), pressKeys("cmd+c"), focusApp(""), pressKeys("cmd+v")],
    ["copy", "paste"],
  ),

  // Finder: "Go to Folder" then type the path
  seed(
    "Navigate to a folder in Finder",
    [focusApp("com.apple.finder"), pressKeys("cmd+shift+g"), typeText("")],
    ["finder", "folder", "navigate"],
  ),

  // Finder: new folder then type its name
  seed(
    "Create a new folder in Finder",
    [focusApp("com.apple.finder"), pressKeys("cmd+shift+n"), typeText("")],
    ["finder", "folder", "create"],
  ),

  // Any app: close the current window
  seed(
    "Close the current window",
    [focusApp(""), pressKeys("cmd+w")],
    ["close", "window"],
  ),

  // Any app: select everything, then copy
  seed(
    "Select all content and copy",
    [focusApp(""), pressKeys("cmd+a"), pressKeys("cmd+c")],
    ["select", "all", "copy"],
  ),

  // List running applications
  seed(
    "List all running applications",
    [{ tool: "apps", params: {} }],
    ["apps", "list", "running"],
  ),

  // Inspect an app's UI element tree
  seed(
    "Inspect an app's UI element tree",
    [focusApp(""), { tool: "ui_tree", params: { pid: 0 } }],
    ["inspect", "tree", "accessibility"],
  ),

  // Chrome: new tab, then navigate
  seed(
    "Open a new Chrome tab and navigate to URL",
    [focusApp("com.google.Chrome"), pressKeys("cmd+t"), navigateTo("")],
    ["chrome", "tab", "new"],
  ),

  // Any app: export as PDF through the File menu
  seed(
    "Export document as PDF",
    [focusApp(""), { tool: "menu_click", params: { menuPath: "File/Export as PDF" } }],
    ["export", "pdf"],
  ),
];
@@ -1,201 +0,0 @@
1
- // Copyright (C) 2025 Clazro Technology Private Limited
2
- // SPDX-License-Identifier: AGPL-3.0-only
3
- //
4
- // This file is part of ScreenHand.
5
- //
6
- // ScreenHand is free software: you can redistribute it and/or modify
7
- // it under the terms of the GNU Affero General Public License as
8
- // published by the Free Software Foundation, version 3.
9
- //
10
- // ScreenHand is distributed in the hope that it will be useful,
11
- // but WITHOUT ANY WARRANTY; without even the implied warranty of
12
- // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
- // GNU Affero General Public License for more details.
14
- //
15
- // You should have received a copy of the GNU Affero General Public License
16
- // along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
17
-
18
- /**
19
- * Learning Memory — Session tracking with auto-save
20
- *
21
- * Tracks a rolling buffer of actions within a "task session".
22
- * Auto-saves strategies when a successful sequence is detected:
23
- * - 3+ consecutive successes followed by a gap (>60s) or session end
24
- * - Or explicit endSession() call
25
- */
26
-
27
- import type { ActionEntry, Strategy, StrategyStep } from "./types.js";
28
- import { MemoryStore } from "./store.js";
29
- import type { RecallEngine } from "./recall.js";
30
-
31
/** Idle time (ms) after which the current session is considered over. */
const SESSION_GAP_MS = 60_000;
/** Maximum number of buffered actions; the oldest entry is dropped beyond this. */
const MAX_BUFFER_SIZE = 100;
/** Minimum trailing run of successful actions required for an auto-save. */
const MIN_AUTO_SAVE_STEPS = 3;
/** Parameter names whose string values are used when inferring a task description. */
const DESCRIPTIVE_PARAM_KEYS: ReadonlySet<string> = new Set([
  "bundleId",
  "title",
  "url",
  "text",
  "script",
  "selector",
  "menuPath",
]);

/**
 * Tracks the actions of the current task session in a bounded buffer and
 * turns successful runs into stored strategies.
 *
 * A strategy is saved either explicitly through {@link SessionTracker.endSession}
 * or automatically when a session is replaced (new session started, or the
 * idle gap exceeded) while the buffer ends with at least
 * `MIN_AUTO_SAVE_STEPS` consecutive successful actions.
 */
export class SessionTracker {
  private readonly store: MemoryStore;
  private sessionId: string;
  private taskDescription: string | null = null;
  private buffer: ActionEntry[] = [];
  /** Timestamp (ms) of the latest activity; 0 means the session has none yet. */
  private lastActionTime = 0;

  /**
   * @param store - Store that receives saved strategies.
   */
  constructor(store: MemoryStore) {
    this.store = store;
    this.sessionId = SessionTracker.generateId();
  }

  /** Build a session id from the current time plus a short random suffix. */
  private static generateId(): string {
    return "s_" + Date.now().toString(36) + Math.random().toString(36).slice(2, 6);
  }

  /**
   * Start (or restart) a task session.
   *
   * The previous session's buffer is offered to auto-save first.
   *
   * @param taskDescription - Optional label for the new session.
   * @returns The id of the new session.
   */
  startSession(taskDescription?: string): string {
    this.tryAutoSave();

    this.sessionId = SessionTracker.generateId();
    this.taskDescription = taskDescription ?? null;
    this.buffer = [];
    this.lastActionTime = Date.now();
    return this.sessionId;
  }

  /**
   * Get the current session id, rotating to a fresh session first when the
   * idle gap has been exceeded.
   *
   * After such a rotation the id stays the same across repeated calls until
   * the next action is recorded or a session is started.
   */
  getSessionId(): string {
    this.rotateIfStale(Date.now());
    return this.sessionId;
  }

  /**
   * Append an action to the current session, rotating to a fresh session
   * first when the idle gap has been exceeded.
   *
   * @param entry - The action to record.
   */
  recordAction(entry: ActionEntry): void {
    const now = Date.now();
    this.rotateIfStale(now);
    this.lastActionTime = now;

    this.buffer.push(entry);
    if (this.buffer.length > MAX_BUFFER_SIZE) {
      // Keep only the most recent MAX_BUFFER_SIZE actions.
      this.buffer.shift();
    }
  }

  /**
   * Close out the buffered actions, saving them as a strategy on success.
   *
   * The buffer is emptied in every case; the session id and the stored task
   * description are left as they are.
   *
   * @param success - Whether the task succeeded.
   * @param taskDescription - Label to use instead of the session's own.
   * @returns The saved strategy, or `null` when `success` is false, no task
   *   description is available, or no actions were buffered.
   */
  endSession(success: boolean, taskDescription?: string): Strategy | null {
    const task = taskDescription ?? this.taskDescription;
    if (!success || !task || this.buffer.length === 0) {
      this.buffer = [];
      return null;
    }

    const strategy = this.buildStrategy(task, this.buffer);
    this.store.appendStrategy(strategy);
    this.buffer = [];
    return strategy;
  }

  /** Get a shallow copy of the current session's action buffer. */
  getBuffer(): ActionEntry[] {
    return [...this.buffer];
  }

  /**
   * Get the tool names of the most recent buffered actions, oldest first.
   *
   * @param limit - Maximum number of names to return (default 10).
   */
  getRecentToolNames(limit = 10): string[] {
    return this.buffer.slice(-limit).map((a) => a.tool);
  }

  /** Get the current task description, or `null` when none is set. */
  getTaskDescription(): string | null {
    return this.taskDescription;
  }

  // ── session rotation ───────────────────────────

  /**
   * Replace the session with a fresh, unnamed one when more than
   * `SESSION_GAP_MS` has passed since the last activity.
   *
   * The outgoing buffer is offered to auto-save. The activity timestamp is
   * reset to 0 so the gap check stays quiet until new activity arrives;
   * without that reset every later `getSessionId()` call would see the same
   * stale timestamp and mint yet another id.
   *
   * @param now - Current time in milliseconds.
   */
  private rotateIfStale(now: number): void {
    if (this.lastActionTime === 0 || now - this.lastActionTime <= SESSION_GAP_MS) {
      return;
    }
    this.tryAutoSave();
    this.sessionId = SessionTracker.generateId();
    this.buffer = [];
    this.taskDescription = null;
    this.lastActionTime = 0;
  }

  // ── auto-save logic ────────────────────────────

  /**
   * Save the trailing run of successful actions as a strategy.
   *
   * Does nothing unless the buffer ends with at least `MIN_AUTO_SAVE_STEPS`
   * consecutive successes. When the session has no task description, one is
   * inferred from the actions themselves.
   */
  private tryAutoSave(): void {
    if (this.buffer.length < MIN_AUTO_SAVE_STEPS) return;

    // Walk back from the end to the start of the trailing success run.
    let streakStart = this.buffer.length;
    while (streakStart > 0 && this.buffer[streakStart - 1]?.success) {
      streakStart--;
    }
    const successStreak = this.buffer.slice(streakStart);

    if (successStreak.length < MIN_AUTO_SAVE_STEPS) return;

    const task = this.taskDescription ?? this.inferTaskDescription(successStreak);

    const strategy = this.buildStrategy(task, successStreak);
    this.store.appendStrategy(strategy);
  }

  /**
   * Derive a task description from a sequence of actions.
   *
   * The result is the distinct tool names joined with " → ", followed by up
   * to three parameter values in parentheses. Only string values of 3 to 59
   * characters under one of the descriptive keys are considered.
   */
  private inferTaskDescription(actions: ActionEntry[]): string {
    const tools = [...new Set(actions.map((a) => a.tool))];
    const keyParams: string[] = [];
    for (const a of actions) {
      for (const [key, val] of Object.entries(a.params)) {
        if (
          typeof val === "string" &&
          val.length > 2 &&
          val.length < 60 &&
          DESCRIPTIVE_PARAM_KEYS.has(key)
        ) {
          keyParams.push(val);
        }
      }
    }
    const paramHint = keyParams.length > 0 ? ` (${keyParams.slice(0, 3).join(", ")})` : "";
    return `${tools.join(" → ")}${paramHint}`;
  }

  /**
   * Assemble a strategy record from a task label and its actions.
   *
   * The duration is the sum of the actions' durations; the new strategy
   * starts with one success and no failures.
   */
  private buildStrategy(task: string, actions: ActionEntry[]): Strategy {
    const steps: StrategyStep[] = actions.map((a) => ({
      tool: a.tool,
      params: a.params,
    }));

    const totalDurationMs = actions.reduce((sum, a) => sum + a.durationMs, 0);
    const tags = extractTags(task, steps);
    const fingerprint = MemoryStore.makeFingerprint(steps.map((s) => s.tool));

    return {
      id: "str_" + Date.now().toString(36) + Math.random().toString(36).slice(2, 6),
      task,
      steps,
      totalDurationMs,
      successCount: 1,
      failCount: 0,
      lastUsed: new Date().toISOString(),
      tags,
      fingerprint,
    };
  }
}
193
-
194
/**
 * Collect the tags for a strategy.
 *
 * Tags are the lower-cased words of the task description that are at least
 * three characters long (split on runs of non-word characters), followed by
 * the tool name of every step. Duplicates are removed and first-seen order
 * is kept.
 *
 * @param task - Task description to mine for words.
 * @param steps - Steps whose tool names are added as tags.
 * @returns The de-duplicated tag list.
 */
function extractTags(task: string, steps: StrategyStep[]): string[] {
  const taskWords = task
    .toLowerCase()
    .split(/\W+/)
    .filter((word) => word.length >= 3);
  const toolNames = steps.map((step) => step.tool);
  return Array.from(new Set([...taskWords, ...toolNames]));
}