screenhand 0.1.1 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +193 -109
- package/bin/darwin-arm64/macos-bridge +0 -0
- package/dist/mcp-desktop.js +5876 -0
- package/dist/scripts/codex-monitor-daemon.js +335 -0
- package/dist/scripts/export-help-center.js +112 -0
- package/dist/scripts/marketing-loop.js +117 -0
- package/dist/scripts/observer-daemon.js +288 -0
- package/dist/scripts/orchestrator-daemon.js +399 -0
- package/dist/scripts/supervisor-daemon.js +272 -0
- package/dist/scripts/threads-campaign.js +208 -0
- package/dist/scripts/worker-daemon.js +228 -0
- package/dist/src/agent/cli.js +82 -0
- package/dist/src/agent/loop.js +274 -0
- package/dist/src/community/fetcher.js +109 -0
- package/dist/src/community/index.js +6 -0
- package/dist/src/community/publisher.js +191 -0
- package/dist/src/community/remote-api.js +121 -0
- package/dist/src/community/types.js +3 -0
- package/dist/src/community/validator.js +95 -0
- package/{src/config.ts → dist/src/config.js} +5 -10
- package/dist/src/context-tracker.js +489 -0
- package/{src/index.ts → dist/src/index.js} +32 -52
- package/dist/src/ingestion/coverage-auditor.js +233 -0
- package/dist/src/ingestion/doc-parser.js +164 -0
- package/dist/src/ingestion/index.js +8 -0
- package/dist/src/ingestion/menu-scanner.js +152 -0
- package/dist/src/ingestion/reference-merger.js +186 -0
- package/dist/src/ingestion/shortcut-extractor.js +180 -0
- package/dist/src/ingestion/tutorial-extractor.js +170 -0
- package/dist/src/ingestion/types.js +3 -0
- package/dist/src/jobs/manager.js +305 -0
- package/dist/src/jobs/runner.js +806 -0
- package/dist/src/jobs/store.js +102 -0
- package/dist/src/jobs/types.js +30 -0
- package/dist/src/jobs/worker.js +97 -0
- package/dist/src/learning/engine.js +356 -0
- package/dist/src/learning/index.js +9 -0
- package/dist/src/learning/locator-policy.js +120 -0
- package/dist/src/learning/pattern-policy.js +89 -0
- package/dist/src/learning/recovery-policy.js +116 -0
- package/dist/src/learning/sensor-policy.js +115 -0
- package/dist/src/learning/timing-model.js +204 -0
- package/dist/src/learning/topology-policy.js +90 -0
- package/dist/src/learning/types.js +9 -0
- package/dist/src/logging/timeline-logger.js +48 -0
- package/dist/src/mcp/mcp-stdio-server.js +464 -0
- package/dist/src/mcp/server.js +363 -0
- package/dist/src/mcp-entry.js +60 -0
- package/dist/src/memory/playbook-seeds.js +200 -0
- package/dist/src/memory/recall.js +222 -0
- package/dist/src/memory/research.js +104 -0
- package/dist/src/memory/seeds.js +101 -0
- package/dist/src/memory/service.js +446 -0
- package/dist/src/memory/session.js +169 -0
- package/dist/src/memory/store.js +451 -0
- package/{src/runtime/locator-cache.ts → dist/src/memory/types.js} +1 -17
- package/dist/src/monitor/codex-monitor.js +382 -0
- package/dist/src/monitor/task-queue.js +97 -0
- package/dist/src/monitor/types.js +62 -0
- package/dist/src/native/bridge-client.js +412 -0
- package/{src/native/macos-bridge-client.ts → dist/src/native/macos-bridge-client.js} +0 -1
- package/dist/src/observer/state.js +199 -0
- package/dist/src/observer/types.js +43 -0
- package/dist/src/orchestrator/state.js +68 -0
- package/dist/src/orchestrator/types.js +22 -0
- package/dist/src/perception/ax-source.js +162 -0
- package/dist/src/perception/cdp-source.js +162 -0
- package/dist/src/perception/coordinator.js +771 -0
- package/dist/src/perception/frame-differ.js +287 -0
- package/dist/src/perception/index.js +22 -0
- package/dist/src/perception/manager.js +199 -0
- package/dist/src/perception/types.js +47 -0
- package/dist/src/perception/vision-source.js +399 -0
- package/dist/src/planner/deterministic.js +298 -0
- package/dist/src/planner/executor.js +870 -0
- package/dist/src/planner/goal-store.js +92 -0
- package/dist/src/planner/index.js +21 -0
- package/dist/src/planner/planner.js +520 -0
- package/dist/src/planner/tool-registry.js +71 -0
- package/dist/src/planner/types.js +22 -0
- package/dist/src/platform/explorer.js +213 -0
- package/dist/src/platform/help-center-markdown.js +527 -0
- package/dist/src/platform/learner.js +257 -0
- package/dist/src/playbook/engine.js +486 -0
- package/dist/src/playbook/index.js +20 -0
- package/dist/src/playbook/mcp-recorder.js +204 -0
- package/dist/src/playbook/recorder.js +536 -0
- package/dist/src/playbook/runner.js +408 -0
- package/dist/src/playbook/store.js +312 -0
- package/dist/src/playbook/types.js +17 -0
- package/dist/src/recovery/detectors.js +156 -0
- package/dist/src/recovery/engine.js +327 -0
- package/dist/src/recovery/index.js +20 -0
- package/dist/src/recovery/strategies.js +274 -0
- package/dist/src/recovery/types.js +20 -0
- package/dist/src/runtime/accessibility-adapter.js +430 -0
- package/dist/src/runtime/app-adapter.js +64 -0
- package/dist/src/runtime/applescript-adapter.js +305 -0
- package/dist/src/runtime/ax-role-map.js +96 -0
- package/dist/src/runtime/browser-adapter.js +52 -0
- package/dist/src/runtime/cdp-chrome-adapter.js +521 -0
- package/dist/src/runtime/composite-adapter.js +221 -0
- package/dist/src/runtime/execution-contract.js +159 -0
- package/dist/src/runtime/executor.js +286 -0
- package/dist/src/runtime/locator-cache.js +50 -0
- package/dist/src/runtime/planning-loop.js +63 -0
- package/dist/src/runtime/service.js +432 -0
- package/dist/src/runtime/session-manager.js +63 -0
- package/dist/src/runtime/state-observer.js +121 -0
- package/dist/src/runtime/vision-adapter.js +225 -0
- package/dist/src/state/app-map-types.js +72 -0
- package/dist/src/state/app-map.js +1974 -0
- package/dist/src/state/entity-tracker.js +108 -0
- package/dist/src/state/fusion.js +96 -0
- package/dist/src/state/index.js +21 -0
- package/dist/src/state/ladder-generator.js +236 -0
- package/dist/src/state/persistence.js +156 -0
- package/dist/src/state/types.js +17 -0
- package/dist/src/state/world-model.js +1456 -0
- package/dist/src/supervisor/locks.js +186 -0
- package/dist/src/supervisor/supervisor.js +403 -0
- package/dist/src/supervisor/types.js +30 -0
- package/dist/src/test-mcp-protocol.js +154 -0
- package/dist/src/types.js +17 -0
- package/dist/src/util/atomic-write.js +133 -0
- package/dist/src/util/sanitize.js +146 -0
- package/dist-app-maps/com.figma.Desktop.json +959 -0
- package/dist-app-maps/com.hnc.Discord.json +1146 -0
- package/dist-app-maps/notion.id.json +2831 -0
- package/dist-playbooks/canva-screenhand-carousel.json +445 -0
- package/dist-playbooks/codex-desktop.json +76 -0
- package/dist-playbooks/competitor-research-stack.json +122 -0
- package/dist-playbooks/davinci-color-grade.json +153 -0
- package/dist-playbooks/davinci-edit-timeline.json +162 -0
- package/dist-playbooks/davinci-render.json +114 -0
- package/dist-playbooks/devto.json +52 -0
- package/dist-playbooks/discord.json +41 -0
- package/dist-playbooks/google-flow-create-project.json +59 -0
- package/dist-playbooks/google-flow-edit-image.json +90 -0
- package/dist-playbooks/google-flow-edit-video.json +90 -0
- package/dist-playbooks/google-flow-generate-image.json +68 -0
- package/dist-playbooks/google-flow-generate-video.json +191 -0
- package/dist-playbooks/google-flow-open-project.json +48 -0
- package/dist-playbooks/google-flow-open-scenebuilder.json +64 -0
- package/dist-playbooks/google-flow-search-assets.json +64 -0
- package/dist-playbooks/instagram.json +57 -0
- package/dist-playbooks/linkedin.json +52 -0
- package/dist-playbooks/n8n.json +43 -0
- package/dist-playbooks/reddit.json +52 -0
- package/dist-playbooks/threads.json +59 -0
- package/dist-playbooks/x-twitter.json +59 -0
- package/dist-playbooks/youtube.json +59 -0
- package/dist-references/canva.json +646 -0
- package/dist-references/codex-desktop.json +305 -0
- package/dist-references/davinci-resolve-keyboard.json +594 -0
- package/dist-references/davinci-resolve-menu-map.json +1139 -0
- package/dist-references/davinci-resolve-menus-batch1.json +116 -0
- package/dist-references/davinci-resolve-menus-batch2.json +372 -0
- package/dist-references/davinci-resolve-menus-batch3.json +330 -0
- package/dist-references/davinci-resolve-menus-batch4.json +297 -0
- package/dist-references/davinci-resolve-shortcuts.json +333 -0
- package/dist-references/devto.json +317 -0
- package/dist-references/discord.json +549 -0
- package/dist-references/figma.json +1186 -0
- package/dist-references/finder.json +146 -0
- package/dist-references/google-ads-transparency.json +95 -0
- package/dist-references/google-flow.json +649 -0
- package/dist-references/instagram.json +341 -0
- package/dist-references/linkedin.json +324 -0
- package/dist-references/meta-ad-library.json +86 -0
- package/dist-references/n8n.json +387 -0
- package/dist-references/notes.json +27 -0
- package/dist-references/notion.json +163 -0
- package/dist-references/reddit.json +341 -0
- package/dist-references/threads.json +337 -0
- package/dist-references/x-twitter.json +403 -0
- package/dist-references/youtube.json +373 -0
- package/native/macos-bridge/Package.swift +1 -0
- package/native/macos-bridge/Sources/AccessibilityBridge.swift +257 -36
- package/native/macos-bridge/Sources/AppManagement.swift +212 -2
- package/native/macos-bridge/Sources/CoreGraphicsBridge.swift +348 -53
- package/native/macos-bridge/Sources/StreamCapture.swift +136 -0
- package/native/macos-bridge/Sources/VisionBridge.swift +165 -7
- package/native/macos-bridge/Sources/main.swift +169 -16
- package/native/windows-bridge/Program.cs +5 -0
- package/native/windows-bridge/ScreenCapture.cs +124 -0
- package/package.json +29 -4
- package/scripts/postinstall.cjs +127 -0
- package/.claude/commands/automate.md +0 -28
- package/.claude/commands/debug-ui.md +0 -19
- package/.claude/commands/screenshot.md +0 -15
- package/.github/FUNDING.yml +0 -1
- package/.github/ISSUE_TEMPLATE/bug_report.md +0 -27
- package/.github/ISSUE_TEMPLATE/feature_request.md +0 -20
- package/.mcp.json +0 -8
- package/DESKTOP_MCP_GUIDE.md +0 -92
- package/SECURITY.md +0 -44
- package/docs/architecture.md +0 -47
- package/install-skills.sh +0 -19
- package/mcp-bridge.ts +0 -271
- package/mcp-desktop.ts +0 -1221
- package/playbooks/instagram.json +0 -41
- package/playbooks/instagram_v2.json +0 -201
- package/playbooks/x_v1.json +0 -211
- package/scripts/devpost-live-loop.mjs +0 -421
- package/src/logging/timeline-logger.ts +0 -55
- package/src/mcp/server.ts +0 -449
- package/src/memory/recall.ts +0 -191
- package/src/memory/research.ts +0 -146
- package/src/memory/seeds.ts +0 -123
- package/src/memory/session.ts +0 -201
- package/src/memory/store.ts +0 -434
- package/src/memory/types.ts +0 -69
- package/src/native/bridge-client.ts +0 -239
- package/src/runtime/accessibility-adapter.ts +0 -487
- package/src/runtime/app-adapter.ts +0 -169
- package/src/runtime/applescript-adapter.ts +0 -376
- package/src/runtime/ax-role-map.ts +0 -102
- package/src/runtime/browser-adapter.ts +0 -129
- package/src/runtime/cdp-chrome-adapter.ts +0 -676
- package/src/runtime/composite-adapter.ts +0 -274
- package/src/runtime/executor.ts +0 -396
- package/src/runtime/planning-loop.ts +0 -81
- package/src/runtime/service.ts +0 -448
- package/src/runtime/session-manager.ts +0 -50
- package/src/runtime/state-observer.ts +0 -136
- package/src/runtime/vision-adapter.ts +0 -297
- package/src/types.ts +0 -297
- package/tests/bridge-client.test.ts +0 -176
- package/tests/browser-stealth.test.ts +0 -210
- package/tests/composite-adapter.test.ts +0 -64
- package/tests/mcp-server.test.ts +0 -151
- package/tests/memory-recall.test.ts +0 -339
- package/tests/memory-research.test.ts +0 -159
- package/tests/memory-seeds.test.ts +0 -120
- package/tests/memory-store.test.ts +0 -392
- package/tests/types.test.ts +0 -92
- package/tsconfig.check.json +0 -17
- package/tsconfig.json +0 -19
- package/vitest.config.ts +0 -8
- /package/{playbooks → dist-references}/devpost.json +0 -0
|
@@ -0,0 +1,121 @@
|
|
|
1
|
+
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
+
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
+
//
|
|
4
|
+
// This file is part of ScreenHand.
|
|
5
|
+
//
|
|
6
|
+
// ScreenHand is free software: you can redistribute it and/or modify
|
|
7
|
+
// it under the terms of the GNU Affero General Public License as
|
|
8
|
+
// published by the Free Software Foundation, version 3.
|
|
9
|
+
//
|
|
10
|
+
// ScreenHand is distributed in the hope that it will be useful,
|
|
11
|
+
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12
|
+
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13
|
+
// GNU Affero General Public License for more details.
|
|
14
|
+
//
|
|
15
|
+
// You should have received a copy of the GNU Affero General Public License
|
|
16
|
+
// along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
|
|
17
|
+
import { EventEmitter } from "node:events";
|
|
18
|
+
/**
 * Wraps the native bridge's AX observer events into typed UIEvent objects.
 * Buffers events for consumption by the planning loop.
 *
 * Every successfully parsed bridge event is appended to a bounded buffer and
 * re-emitted on this emitter as an "event" event.
 */
export class StateObserver extends EventEmitter {
    /** Bridge object; this class uses its `on(name, listener)` and `call(method, params)`. */
    bridge;
    /** PIDs for which an "observer.start" call has completed. */
    observedPids = new Set();
    /** Parsed events, oldest first, capped at `maxBufferSize` entries. */
    eventBuffer = [];
    /** Maximum number of events retained in `eventBuffer`. */
    maxBufferSize;
    /**
     * @param bridge Bridge that emits "ax-event" and answers `call()` requests.
     * @param maxBufferSize Buffer capacity; the oldest event is dropped on overflow.
     */
    constructor(bridge, maxBufferSize = 200) {
        super();
        this.bridge = bridge;
        this.maxBufferSize = maxBufferSize;
        // Listen for AX events from the bridge
        this.bridge.on("ax-event", (raw) => {
            const event = this.parseEvent(raw);
            if (!event) {
                return;
            }
            this.eventBuffer.push(event);
            if (this.eventBuffer.length > this.maxBufferSize) {
                this.eventBuffer.shift();
            }
            this.emit("event", event);
        });
    }
    /**
     * Ask the bridge to start observing a process. No-op if the pid is already observed.
     *
     * @param pid Process id to observe.
     * @param eventTypes Optional list of event type names; when omitted,
     *   `notifications` is sent as `undefined`. Unknown names are dropped.
     */
    async startObserving(pid, eventTypes) {
        if (this.observedPids.has(pid)) {
            return;
        }
        const notifications = eventTypes
            ? this.mapEventTypesToNotifications(eventTypes)
            : undefined;
        await this.bridge.call("observer.start", { pid, notifications });
        // Only record the pid once the bridge call has succeeded.
        this.observedPids.add(pid);
    }
    /** Ask the bridge to stop observing a process. No-op if the pid is not observed. */
    async stopObserving(pid) {
        if (!this.observedPids.has(pid)) {
            return;
        }
        await this.bridge.call("observer.stop", { pid });
        this.observedPids.delete(pid);
    }
    /** Get and clear the event buffer. */
    drainEvents() {
        const drained = this.eventBuffer;
        this.eventBuffer = [];
        return drained;
    }
    /**
     * Get recent events without clearing.
     *
     * @param limit Maximum number of most-recent events to return.
     * @returns A new array; empty when `limit` is not a positive number.
     */
    peekEvents(limit = 50) {
        // slice(-0) is slice(0) and would return the whole buffer, so a
        // non-positive (or NaN) limit is answered explicitly.
        if (!(limit > 0)) {
            return [];
        }
        return this.eventBuffer.slice(-limit);
    }
    /** Clear the event buffer. */
    clearEvents() {
        this.eventBuffer = [];
    }
    /** True while at least one pid is being observed. */
    get isObserving() {
        return this.observedPids.size > 0;
    }
    /** Snapshot array of the currently observed pids. */
    get observedProcesses() {
        return [...this.observedPids];
    }
    /**
     * Convert a raw bridge payload into an event object.
     *
     * @param raw Payload delivered with "ax-event".
     * @returns The event, or `null` when the payload is missing or has no `type`.
     */
    parseEvent(raw) {
        // A null/undefined payload must not throw inside the bridge's emit().
        const type = raw?.type;
        if (!type) {
            return null;
        }
        const event = {
            type,
            timestamp: raw.timestamp ?? new Date().toISOString(),
            pid: raw.pid ?? 0,
        };
        // Optional fields are copied only when they are strings.
        const optionalStringFields = [
            "bundleId",
            "elementRole",
            "elementLabel",
            "oldValue",
            "newValue",
            "windowTitle",
        ];
        for (const field of optionalStringFields) {
            if (typeof raw[field] === "string") {
                event[field] = raw[field];
            }
        }
        return event;
    }
    /**
     * Translate event type names into AX notification names.
     *
     * @param types Event type names such as "value_changed".
     * @returns Notification names in input order; unknown names are omitted.
     */
    mapEventTypesToNotifications(types) {
        // A Map (rather than a plain object) keeps inherited keys such as
        // "constructor" or "toString" from resolving to functions.
        const notificationByType = new Map([
            ["value_changed", "AXValueChanged"],
            ["focus_changed", "AXFocusedUIElementChanged"],
            ["window_created", "AXWindowCreated"],
            ["window_closed", "AXUIElementDestroyed"],
            ["title_changed", "AXTitleChanged"],
            ["menu_opened", "AXMenuOpened"],
            ["layout_changed", "AXLayoutChanged"],
            ["dialog_appeared", "AXSheetCreated"],
            ["app_activated", "AXApplicationActivated"],
            ["app_deactivated", "AXApplicationDeactivated"],
        ]);
        return types
            .map((t) => notificationByType.get(t))
            .filter((n) => n !== undefined);
    }
}
|
|
@@ -0,0 +1,225 @@
|
|
|
1
|
+
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
+
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
+
//
|
|
4
|
+
// This file is part of ScreenHand.
|
|
5
|
+
//
|
|
6
|
+
// ScreenHand is free software: you can redistribute it and/or modify
|
|
7
|
+
// it under the terms of the GNU Affero General Public License as
|
|
8
|
+
// published by the Free Software Foundation, version 3.
|
|
9
|
+
//
|
|
10
|
+
// ScreenHand is distributed in the hope that it will be useful,
|
|
11
|
+
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12
|
+
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13
|
+
// GNU Affero General Public License for more details.
|
|
14
|
+
//
|
|
15
|
+
// You should have received a copy of the GNU Affero General Public License
|
|
16
|
+
// along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
|
|
17
|
+
import { randomUUID } from "node:crypto";
|
|
18
|
+
// Delay, in milliseconds, between polling attempts in VisionAdapter.locate() and waitFor().
const POLL_INTERVAL_MS = 200;
|
|
19
|
+
/**
 * Vision-based adapter for apps with poor/no accessibility support.
 * Uses screenshots + OCR to locate elements and CG events to interact.
 *
 * All work is delegated to the bridge via `bridge.call(method, params)`.
 */
export class VisionAdapter {
    /** Bridge object; this class uses its `start()` and `call(method, params)`. */
    bridge;
    /** Session state keyed by session id. */
    sessions = new Map();
    /** The same session state objects, keyed by profile. */
    sessionsByProfile = new Map();
    constructor(bridge) {
        this.bridge = bridge;
    }
    /**
     * Create a session bound to the current frontmost app, or return the
     * existing session info for `profile`.
     *
     * @param profile Profile key; at most one session is kept per profile.
     * @param reuseSessionId Optional session id to use instead of a generated one.
     * @returns The session info object.
     */
    async attach(profile, reuseSessionId) {
        const existing = this.sessionsByProfile.get(profile);
        if (existing) {
            return existing.info;
        }
        await this.bridge.start();
        const frontmost = await this.bridge.call("app.frontmost");
        const info = {
            sessionId: reuseSessionId ?? `vision_session_${profile}_${Date.now()}_${randomUUID().slice(0, 8)}`,
            profile,
            createdAt: new Date().toISOString(),
            adapterType: "vision",
        };
        const state = {
            info,
            pid: frontmost.pid,
            bundleId: frontmost.bundleId,
            appName: frontmost.name,
        };
        this.sessions.set(info.sessionId, state);
        this.sessionsByProfile.set(profile, state);
        return info;
    }
    /**
     * Describe the app the session is bound to.
     * The app name doubles as `windowTitle`.
     *
     * @throws Error when the session id is unknown.
     */
    async getAppContext(sessionId) {
        const { bundleId, appName, pid } = this.requireSession(sessionId);
        return {
            bundleId,
            appName,
            pid,
            windowTitle: appName,
        };
    }
    /** Page-style metadata for the session: an `app://<bundleId>` URL and the app name as title. */
    async getPageMeta(sessionId) {
        const ctx = await this.getAppContext(sessionId);
        return {
            url: `app://${ctx.bundleId}`,
            title: ctx.appName,
        };
    }
    /**
     * For `app://<bundleId>` URLs, launch that app and rebind the session to
     * it; other URLs leave the session untouched.
     *
     * @returns The session's page metadata after any rebind.
     * @throws Error when the session id is unknown (checked before launching).
     */
    async navigate(sessionId, url, _timeoutMs) {
        // Validate first so an unknown session never triggers an app launch.
        const state = this.requireSession(sessionId);
        const scheme = "app://";
        if (url.startsWith(scheme)) {
            const bundleId = url.slice(scheme.length);
            const result = await this.bridge.call("app.launch", { bundleId });
            state.pid = result.pid;
            state.bundleId = result.bundleId;
            state.appName = result.appName;
        }
        return this.getPageMeta(sessionId);
    }
    /**
     * Locate a target on screen.
     *
     * Coordinate targets resolve immediately. Targets with searchable text are
     * polled (screenshot + text search) until a match is found or `timeoutMs`
     * elapses. Other targets cannot be located and yield `null`.
     *
     * @param sessionId Session to operate on.
     * @param target Target descriptor; `target.type` selects the strategy.
     * @param timeoutMs Polling budget in milliseconds for text searches.
     * @returns An element handle, or `null` when nothing was found.
     * @throws Error when the session id is unknown.
     */
    async locate(sessionId, target, timeoutMs) {
        const state = this.requireSession(sessionId);
        // The search text does not change between polls, so compute it once.
        const searchText = this.getSearchText(target);
        if (!searchText) {
            // Coordinate targets need neither a screenshot nor a time budget.
            if (target.type === "coordinates") {
                return {
                    handleId: `vision_coords_${target.x}_${target.y}`,
                    locatorUsed: "vision:coordinates",
                    coordinates: { x: target.x, y: target.y, width: 1, height: 1 },
                };
            }
            return null;
        }
        const deadline = Date.now() + timeoutMs;
        while (Date.now() < deadline) {
            // Take a screenshot
            const screenshotResult = await this.bridge.call("cg.captureScreen", {});
            state.lastScreenshotPath = screenshotResult.path;
            // OCR the screenshot
            const matches = await this.bridge.call("vision.findText", {
                imagePath: screenshotResult.path,
                searchText,
            });
            // Tolerate a bridge that answers with something other than an array.
            if (Array.isArray(matches) && matches.length > 0) {
                const best = matches.reduce((a, b) => (a.confidence > b.confidence ? a : b));
                return {
                    handleId: `vision_${Date.now()}_${Math.random().toString(36).slice(2, 8)}`,
                    locatorUsed: `vision:text:${searchText}`,
                    label: best.text,
                    coordinates: best.bounds,
                };
            }
            await sleep(POLL_INTERVAL_MS);
        }
        return null;
    }
    /**
     * Click the centre of the element's bounding box.
     *
     * @throws Error when the element has no coordinates.
     */
    async click(_sessionId, element) {
        if (!element.coordinates) {
            throw new Error("Vision adapter requires coordinates to click");
        }
        const { x, y, width, height } = element.coordinates;
        await this.bridge.call("cg.mouseClick", { x: x + width / 2, y: y + height / 2 });
    }
    /**
     * Click the element, optionally send cmd+a, then type `text`.
     *
     * @param clear When truthy, cmd+a is sent before typing.
     */
    async setValue(_sessionId, element, text, clear) {
        // Click to focus
        await this.click(_sessionId, element);
        await sleep(100);
        if (clear) {
            await this.bridge.call("cg.keyCombo", { keys: ["cmd", "a"] });
            await sleep(50);
        }
        await this.bridge.call("cg.typeText", { text });
    }
    /** Vision can't reliably read values; returns the element's label, or "" if it has none. */
    async getValue(_sessionId, element) {
        return element.label ?? "";
    }
    /**
     * Poll until a condition holds or `timeoutMs` elapses.
     *
     * Supported condition types: "text_appears", "element_exists",
     * "element_gone". Any other type returns `false` without waiting.
     *
     * @returns `true` when the condition was met, otherwise `false`.
     */
    async waitFor(sessionId, condition, timeoutMs) {
        const deadline = Date.now() + timeoutMs;
        while (Date.now() < deadline) {
            if (condition.type === "text_appears") {
                const found = await this.locate(sessionId, { type: "text", value: condition.text }, 200);
                if (found) {
                    return true;
                }
            }
            else if (condition.type === "element_exists") {
                const found = await this.locate(sessionId, condition.target, 200);
                if (found) {
                    return true;
                }
            }
            else if (condition.type === "element_gone") {
                const found = await this.locate(sessionId, condition.target, 200);
                if (!found) {
                    return true;
                }
            }
            else {
                // Unsupported condition types
                return false;
            }
            await sleep(POLL_INTERVAL_MS);
        }
        return false;
    }
    /**
     * Capture the screen, OCR it, and return the result in the requested format.
     *
     * @param format "text" returns the OCR text, "json" returns the raw OCR
     *   result, anything else returns a `{ headers, rows }` table of regions.
     * @throws Error when the session id is unknown.
     */
    async extract(sessionId, _target, format) {
        const state = this.requireSession(sessionId);
        // Take a fresh screenshot and OCR it
        const screenshotResult = await this.bridge.call("cg.captureScreen", {});
        state.lastScreenshotPath = screenshotResult.path;
        const ocrResult = await this.bridge.call("vision.ocr", { imagePath: screenshotResult.path });
        if (format === "text") {
            return ocrResult.text;
        }
        if (format === "json") {
            return ocrResult;
        }
        // table format
        return {
            headers: ["text", "confidence", "x", "y", "width", "height"],
            rows: ocrResult.regions.map((r) => [
                r.text,
                r.confidence,
                r.bounds.x,
                r.bounds.y,
                r.bounds.width,
                r.bounds.height,
            ]),
        };
    }
    /** Capture the screen (or `region`, when given) and return the image path reported by the bridge. */
    async screenshot(_sessionId, region) {
        const result = await this.bridge.call("cg.captureScreen", region ? { region } : {});
        return result.path;
    }
    /** Send a key combination through the bridge. */
    async keyCombo(_sessionId, keys) {
        await this.bridge.call("cg.keyCombo", { keys });
    }
    /** Not supported by this adapter; always throws. */
    async elementTree(_sessionId, _maxDepth, _root) {
        throw new Error("Vision adapter does not support elementTree — use accessibility adapter");
    }
    // ── Private ──
    /** Look up session state, throwing when the id is unknown. */
    requireSession(sessionId) {
        const state = this.sessions.get(sessionId);
        if (!state) {
            throw new Error(`Session not found: ${sessionId}`);
        }
        return state;
    }
    /** Text to search for on screen for a target, or `null` when the target type has none. */
    getSearchText(target) {
        switch (target.type) {
            case "text":
            case "selector":
            case "ax_attribute":
                return target.value;
            case "role":
                return target.name;
            case "image":
            case "coordinates":
            case "ax_path":
            default:
                return null;
        }
    }
}
|
|
223
|
+
/**
 * Return a promise that resolves (with no value) once a `setTimeout` of `ms`
 * milliseconds fires.
 */
function sleep(ms) {
    return new Promise((done) => {
        setTimeout(done, ms);
    });
}
|
|
@@ -0,0 +1,72 @@
|
|
|
1
|
+
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
+
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
+
// ── Rating System (F → 0) ──────────────────────────────────────────
|
|
4
|
+
//
|
|
5
|
+
// Game-style rating: F E D C B A S SS SSS 0
|
|
6
|
+
// Each grade has 3 sub-tiers: e.g. B1 (entry), B2 (mid), B3 (top)
|
|
7
|
+
// Graded by 10 weighted factors scored 0-100
|
|
8
|
+
//
|
|
9
|
+
// Years-equivalent mapping:
|
|
10
|
+
// F = just opened the app
|
|
11
|
+
// E = ~1 week user
|
|
12
|
+
// D = ~1-3 months
|
|
13
|
+
// C = ~6-12 months
|
|
14
|
+
// B = ~1-3 years (consistent daily user)
|
|
15
|
+
// A = ~3-5 years (power user / team lead)
|
|
16
|
+
// S = ~5-10 years (department architect)
|
|
17
|
+
// SS = ~10-20 years (platform expert, builds systems)
|
|
18
|
+
// SSS = ~20+ years (framework builder, trains others)
|
|
19
|
+
// 0 = Class Zero — transcendent mastery, all 10 factors maxed
|
|
20
|
+
/** Every rating grade, ordered from the lowest ("F") to the highest ("0", Class Zero). */
export const RATING_GRADES = [
    "F",
    "E",
    "D",
    "C",
    "B",
    "A",
    "S",
    "SS",
    "SSS",
    "0",
];
|
|
22
|
+
/**
 * Weight of each rating factor; the ten weights add up to 100.
 *
 * The four hard-to-fake signals (consistency, platformKnowledge,
 * edgeCaseHandling, teachingAbility) carry 57 points; the remaining six
 * factors carry the other 43.
 */
export const RATING_FACTOR_WEIGHTS = {
    // THE core signal — can't fake showing up 50+ times
    consistency: 20,
    // shortcuts, deep features — proves real knowledge
    platformKnowledge: 15,
    // surviving unexpected states — proves resilience
    edgeCaseHandling: 12,
    // exporting playbooks — proves codifiable mastery
    teachingAbility: 10,
    // breadth of features used (session-gated)
    featureCoverage: 10,
    // multi-step workflows completed (session-gated)
    workflowDepth: 8,
    // verified outcomes (session-gated)
    outcomeVerification: 8,
    // healing from failures — honest if it happens
    errorRecovery: 7,
    // combining features end-to-end
    crossFeatureChains: 5,
    // repeat mastery across sessions
    speedEfficiency: 5,
};
|
|
35
|
+
/**
 * Default app-map configuration values.
 *
 * NOTE(review): `mapsDir` is empty here — presumably callers supply the real
 * directory; confirm against the code that consumes this object.
 */
export const DEFAULT_APP_MAP_CONFIG = {
    mapsDir: "",

    // Staleness / decay / pruning settings
    staleThresholdDays: 7,
    versionDecayFactor: 0.5,
    pruneSessionThreshold: 10,

    // Size caps
    maxZonesPerApp: 50,
    maxElementsPerZone: 100,
    maxEdges: 200,
    maxHistoryEntries: 100,
    maxHierarchyEntriesPerZone: 50,
    maxContractsPerZone: 30,
    maxOutcomesPerContract: 5,
    maxStateDimensions: 30,
    maxStateTransitions: 100,
    maxVisibilityConditions: 200,
    maxTimingProfiles: 100,
    maxReadySignals: 50,
};
|
|
53
|
+
// ── Rating Utility ──────────────────────────────────────────────────
|
|
54
|
+
/**
 * Convert a rating to its display string, e.g. "B2", "SS3", or "0".
 *
 * @param r Rating object with a `grade` and, for every grade except "0", a `subTier`.
 * @returns The grade followed by its sub-tier. Class Zero ("0") is shown
 *   without a sub-tier, and a missing sub-tier is omitted.
 */
export function ratingToString(r) {
    if (r.grade === "0") {
        return "0"; // Class Zero has no sub-tier display
    }
    // A null/undefined sub-tier must not leak into the label as "undefined".
    return `${r.grade}${r.subTier ?? ""}`;
}
|
|
60
|
+
/**
 * Minimum weighted score (0-100 scale) required for each grade.
 * Entries are listed from the highest grade down to the lowest.
 */
export const GRADE_THRESHOLDS = [
    // Class Zero — near-perfect across all factors
    { grade: "0", minScore: 97 },
    // 20+ years equivalent
    { grade: "SSS", minScore: 90 },
    // 10-20 years
    { grade: "SS", minScore: 82 },
    // 5-10 years
    { grade: "S", minScore: 73 },
    // 3-5 years
    { grade: "A", minScore: 62 },
    // 1-3 years
    { grade: "B", minScore: 50 },
    // 6-12 months
    { grade: "C", minScore: 38 },
    // 1-3 months
    { grade: "D", minScore: 25 },
    // ~1 week
    { grade: "E", minScore: 12 },
    // just opened the app
    { grade: "F", minScore: 0 },
];
|