screenhand 0.1.1 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +193 -109
- package/bin/darwin-arm64/macos-bridge +0 -0
- package/dist/mcp-desktop.js +5876 -0
- package/dist/scripts/codex-monitor-daemon.js +335 -0
- package/dist/scripts/export-help-center.js +112 -0
- package/dist/scripts/marketing-loop.js +117 -0
- package/dist/scripts/observer-daemon.js +288 -0
- package/dist/scripts/orchestrator-daemon.js +399 -0
- package/dist/scripts/supervisor-daemon.js +272 -0
- package/dist/scripts/threads-campaign.js +208 -0
- package/dist/scripts/worker-daemon.js +228 -0
- package/dist/src/agent/cli.js +82 -0
- package/dist/src/agent/loop.js +274 -0
- package/dist/src/community/fetcher.js +109 -0
- package/dist/src/community/index.js +6 -0
- package/dist/src/community/publisher.js +191 -0
- package/dist/src/community/remote-api.js +121 -0
- package/dist/src/community/types.js +3 -0
- package/dist/src/community/validator.js +95 -0
- package/{src/config.ts → dist/src/config.js} +5 -10
- package/dist/src/context-tracker.js +489 -0
- package/{src/index.ts → dist/src/index.js} +32 -52
- package/dist/src/ingestion/coverage-auditor.js +233 -0
- package/dist/src/ingestion/doc-parser.js +164 -0
- package/dist/src/ingestion/index.js +8 -0
- package/dist/src/ingestion/menu-scanner.js +152 -0
- package/dist/src/ingestion/reference-merger.js +186 -0
- package/dist/src/ingestion/shortcut-extractor.js +180 -0
- package/dist/src/ingestion/tutorial-extractor.js +170 -0
- package/dist/src/ingestion/types.js +3 -0
- package/dist/src/jobs/manager.js +305 -0
- package/dist/src/jobs/runner.js +806 -0
- package/dist/src/jobs/store.js +102 -0
- package/dist/src/jobs/types.js +30 -0
- package/dist/src/jobs/worker.js +97 -0
- package/dist/src/learning/engine.js +356 -0
- package/dist/src/learning/index.js +9 -0
- package/dist/src/learning/locator-policy.js +120 -0
- package/dist/src/learning/pattern-policy.js +89 -0
- package/dist/src/learning/recovery-policy.js +116 -0
- package/dist/src/learning/sensor-policy.js +115 -0
- package/dist/src/learning/timing-model.js +204 -0
- package/dist/src/learning/topology-policy.js +90 -0
- package/dist/src/learning/types.js +9 -0
- package/dist/src/logging/timeline-logger.js +48 -0
- package/dist/src/mcp/mcp-stdio-server.js +464 -0
- package/dist/src/mcp/server.js +363 -0
- package/dist/src/mcp-entry.js +60 -0
- package/dist/src/memory/playbook-seeds.js +200 -0
- package/dist/src/memory/recall.js +222 -0
- package/dist/src/memory/research.js +104 -0
- package/dist/src/memory/seeds.js +101 -0
- package/dist/src/memory/service.js +446 -0
- package/dist/src/memory/session.js +169 -0
- package/dist/src/memory/store.js +451 -0
- package/{src/runtime/locator-cache.ts → dist/src/memory/types.js} +1 -17
- package/dist/src/monitor/codex-monitor.js +382 -0
- package/dist/src/monitor/task-queue.js +97 -0
- package/dist/src/monitor/types.js +62 -0
- package/dist/src/native/bridge-client.js +412 -0
- package/{src/native/macos-bridge-client.ts → dist/src/native/macos-bridge-client.js} +0 -1
- package/dist/src/observer/state.js +199 -0
- package/dist/src/observer/types.js +43 -0
- package/dist/src/orchestrator/state.js +68 -0
- package/dist/src/orchestrator/types.js +22 -0
- package/dist/src/perception/ax-source.js +162 -0
- package/dist/src/perception/cdp-source.js +162 -0
- package/dist/src/perception/coordinator.js +771 -0
- package/dist/src/perception/frame-differ.js +287 -0
- package/dist/src/perception/index.js +22 -0
- package/dist/src/perception/manager.js +199 -0
- package/dist/src/perception/types.js +47 -0
- package/dist/src/perception/vision-source.js +399 -0
- package/dist/src/planner/deterministic.js +298 -0
- package/dist/src/planner/executor.js +870 -0
- package/dist/src/planner/goal-store.js +92 -0
- package/dist/src/planner/index.js +21 -0
- package/dist/src/planner/planner.js +520 -0
- package/dist/src/planner/tool-registry.js +71 -0
- package/dist/src/planner/types.js +22 -0
- package/dist/src/platform/explorer.js +213 -0
- package/dist/src/platform/help-center-markdown.js +527 -0
- package/dist/src/platform/learner.js +257 -0
- package/dist/src/playbook/engine.js +486 -0
- package/dist/src/playbook/index.js +20 -0
- package/dist/src/playbook/mcp-recorder.js +204 -0
- package/dist/src/playbook/recorder.js +536 -0
- package/dist/src/playbook/runner.js +408 -0
- package/dist/src/playbook/store.js +312 -0
- package/dist/src/playbook/types.js +17 -0
- package/dist/src/recovery/detectors.js +156 -0
- package/dist/src/recovery/engine.js +327 -0
- package/dist/src/recovery/index.js +20 -0
- package/dist/src/recovery/strategies.js +274 -0
- package/dist/src/recovery/types.js +20 -0
- package/dist/src/runtime/accessibility-adapter.js +430 -0
- package/dist/src/runtime/app-adapter.js +64 -0
- package/dist/src/runtime/applescript-adapter.js +305 -0
- package/dist/src/runtime/ax-role-map.js +96 -0
- package/dist/src/runtime/browser-adapter.js +52 -0
- package/dist/src/runtime/cdp-chrome-adapter.js +521 -0
- package/dist/src/runtime/composite-adapter.js +221 -0
- package/dist/src/runtime/execution-contract.js +159 -0
- package/dist/src/runtime/executor.js +286 -0
- package/dist/src/runtime/locator-cache.js +50 -0
- package/dist/src/runtime/planning-loop.js +63 -0
- package/dist/src/runtime/service.js +432 -0
- package/dist/src/runtime/session-manager.js +63 -0
- package/dist/src/runtime/state-observer.js +121 -0
- package/dist/src/runtime/vision-adapter.js +225 -0
- package/dist/src/state/app-map-types.js +72 -0
- package/dist/src/state/app-map.js +1974 -0
- package/dist/src/state/entity-tracker.js +108 -0
- package/dist/src/state/fusion.js +96 -0
- package/dist/src/state/index.js +21 -0
- package/dist/src/state/ladder-generator.js +236 -0
- package/dist/src/state/persistence.js +156 -0
- package/dist/src/state/types.js +17 -0
- package/dist/src/state/world-model.js +1456 -0
- package/dist/src/supervisor/locks.js +186 -0
- package/dist/src/supervisor/supervisor.js +403 -0
- package/dist/src/supervisor/types.js +30 -0
- package/dist/src/test-mcp-protocol.js +154 -0
- package/dist/src/types.js +17 -0
- package/dist/src/util/atomic-write.js +133 -0
- package/dist/src/util/sanitize.js +146 -0
- package/dist-app-maps/com.figma.Desktop.json +959 -0
- package/dist-app-maps/com.hnc.Discord.json +1146 -0
- package/dist-app-maps/notion.id.json +2831 -0
- package/dist-playbooks/canva-screenhand-carousel.json +445 -0
- package/dist-playbooks/codex-desktop.json +76 -0
- package/dist-playbooks/competitor-research-stack.json +122 -0
- package/dist-playbooks/davinci-color-grade.json +153 -0
- package/dist-playbooks/davinci-edit-timeline.json +162 -0
- package/dist-playbooks/davinci-render.json +114 -0
- package/dist-playbooks/devto.json +52 -0
- package/dist-playbooks/discord.json +41 -0
- package/dist-playbooks/google-flow-create-project.json +59 -0
- package/dist-playbooks/google-flow-edit-image.json +90 -0
- package/dist-playbooks/google-flow-edit-video.json +90 -0
- package/dist-playbooks/google-flow-generate-image.json +68 -0
- package/dist-playbooks/google-flow-generate-video.json +191 -0
- package/dist-playbooks/google-flow-open-project.json +48 -0
- package/dist-playbooks/google-flow-open-scenebuilder.json +64 -0
- package/dist-playbooks/google-flow-search-assets.json +64 -0
- package/dist-playbooks/instagram.json +57 -0
- package/dist-playbooks/linkedin.json +52 -0
- package/dist-playbooks/n8n.json +43 -0
- package/dist-playbooks/reddit.json +52 -0
- package/dist-playbooks/threads.json +59 -0
- package/dist-playbooks/x-twitter.json +59 -0
- package/dist-playbooks/youtube.json +59 -0
- package/dist-references/canva.json +646 -0
- package/dist-references/codex-desktop.json +305 -0
- package/dist-references/davinci-resolve-keyboard.json +594 -0
- package/dist-references/davinci-resolve-menu-map.json +1139 -0
- package/dist-references/davinci-resolve-menus-batch1.json +116 -0
- package/dist-references/davinci-resolve-menus-batch2.json +372 -0
- package/dist-references/davinci-resolve-menus-batch3.json +330 -0
- package/dist-references/davinci-resolve-menus-batch4.json +297 -0
- package/dist-references/davinci-resolve-shortcuts.json +333 -0
- package/dist-references/devto.json +317 -0
- package/dist-references/discord.json +549 -0
- package/dist-references/figma.json +1186 -0
- package/dist-references/finder.json +146 -0
- package/dist-references/google-ads-transparency.json +95 -0
- package/dist-references/google-flow.json +649 -0
- package/dist-references/instagram.json +341 -0
- package/dist-references/linkedin.json +324 -0
- package/dist-references/meta-ad-library.json +86 -0
- package/dist-references/n8n.json +387 -0
- package/dist-references/notes.json +27 -0
- package/dist-references/notion.json +163 -0
- package/dist-references/reddit.json +341 -0
- package/dist-references/threads.json +337 -0
- package/dist-references/x-twitter.json +403 -0
- package/dist-references/youtube.json +373 -0
- package/native/macos-bridge/Package.swift +1 -0
- package/native/macos-bridge/Sources/AccessibilityBridge.swift +257 -36
- package/native/macos-bridge/Sources/AppManagement.swift +212 -2
- package/native/macos-bridge/Sources/CoreGraphicsBridge.swift +348 -53
- package/native/macos-bridge/Sources/StreamCapture.swift +136 -0
- package/native/macos-bridge/Sources/VisionBridge.swift +165 -7
- package/native/macos-bridge/Sources/main.swift +169 -16
- package/native/windows-bridge/Program.cs +5 -0
- package/native/windows-bridge/ScreenCapture.cs +124 -0
- package/package.json +29 -4
- package/scripts/postinstall.cjs +127 -0
- package/.claude/commands/automate.md +0 -28
- package/.claude/commands/debug-ui.md +0 -19
- package/.claude/commands/screenshot.md +0 -15
- package/.github/FUNDING.yml +0 -1
- package/.github/ISSUE_TEMPLATE/bug_report.md +0 -27
- package/.github/ISSUE_TEMPLATE/feature_request.md +0 -20
- package/.mcp.json +0 -8
- package/DESKTOP_MCP_GUIDE.md +0 -92
- package/SECURITY.md +0 -44
- package/docs/architecture.md +0 -47
- package/install-skills.sh +0 -19
- package/mcp-bridge.ts +0 -271
- package/mcp-desktop.ts +0 -1221
- package/playbooks/instagram.json +0 -41
- package/playbooks/instagram_v2.json +0 -201
- package/playbooks/x_v1.json +0 -211
- package/scripts/devpost-live-loop.mjs +0 -421
- package/src/logging/timeline-logger.ts +0 -55
- package/src/mcp/server.ts +0 -449
- package/src/memory/recall.ts +0 -191
- package/src/memory/research.ts +0 -146
- package/src/memory/seeds.ts +0 -123
- package/src/memory/session.ts +0 -201
- package/src/memory/store.ts +0 -434
- package/src/memory/types.ts +0 -69
- package/src/native/bridge-client.ts +0 -239
- package/src/runtime/accessibility-adapter.ts +0 -487
- package/src/runtime/app-adapter.ts +0 -169
- package/src/runtime/applescript-adapter.ts +0 -376
- package/src/runtime/ax-role-map.ts +0 -102
- package/src/runtime/browser-adapter.ts +0 -129
- package/src/runtime/cdp-chrome-adapter.ts +0 -676
- package/src/runtime/composite-adapter.ts +0 -274
- package/src/runtime/executor.ts +0 -396
- package/src/runtime/planning-loop.ts +0 -81
- package/src/runtime/service.ts +0 -448
- package/src/runtime/session-manager.ts +0 -50
- package/src/runtime/state-observer.ts +0 -136
- package/src/runtime/vision-adapter.ts +0 -297
- package/src/types.ts +0 -297
- package/tests/bridge-client.test.ts +0 -176
- package/tests/browser-stealth.test.ts +0 -210
- package/tests/composite-adapter.test.ts +0 -64
- package/tests/mcp-server.test.ts +0 -151
- package/tests/memory-recall.test.ts +0 -339
- package/tests/memory-research.test.ts +0 -159
- package/tests/memory-seeds.test.ts +0 -120
- package/tests/memory-store.test.ts +0 -392
- package/tests/types.test.ts +0 -92
- package/tsconfig.check.json +0 -17
- package/tsconfig.json +0 -19
- package/vitest.config.ts +0 -8
- /package/{playbooks → dist-references}/devpost.json +0 -0
|
@@ -1,81 +0,0 @@
|
|
|
1
|
-
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
-
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
-
//
|
|
4
|
-
// This file is part of ScreenHand.
|
|
5
|
-
//
|
|
6
|
-
// ScreenHand is free software: you can redistribute it and/or modify
|
|
7
|
-
// it under the terms of the GNU Affero General Public License as
|
|
8
|
-
// published by the Free Software Foundation, version 3.
|
|
9
|
-
//
|
|
10
|
-
// ScreenHand is distributed in the hope that it will be useful,
|
|
11
|
-
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12
|
-
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13
|
-
// GNU Affero General Public License for more details.
|
|
14
|
-
//
|
|
15
|
-
// You should have received a copy of the GNU Affero General Public License
|
|
16
|
-
// along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
|
|
17
|
-
|
|
18
|
-
import type { AppContext, UIEvent } from "../types.js";
|
|
19
|
-
import type { StateObserver } from "./state-observer.js";
|
|
20
|
-
import type { AppAdapter } from "./app-adapter.js";
|
|
21
|
-
|
|
22
|
-
export interface StateSnapshot {
|
|
23
|
-
recentEvents: UIEvent[];
|
|
24
|
-
appContext: AppContext | null;
|
|
25
|
-
lastActionResult: unknown;
|
|
26
|
-
observing: boolean;
|
|
27
|
-
timestamp: string;
|
|
28
|
-
}
|
|
29
|
-
|
|
30
|
-
/**
|
|
31
|
-
* Bidirectional planning loop that buffers UI events between LLM actions
|
|
32
|
-
* and provides state snapshots for the LLM to react to.
|
|
33
|
-
*/
|
|
34
|
-
export class PlanningLoop {
|
|
35
|
-
private lastActionResults = new Map<string, unknown>();
|
|
36
|
-
|
|
37
|
-
constructor(
|
|
38
|
-
private readonly observer: StateObserver,
|
|
39
|
-
private readonly adapter: AppAdapter,
|
|
40
|
-
) {}
|
|
41
|
-
|
|
42
|
-
/** Get a state snapshot for the LLM after an action. */
|
|
43
|
-
async getStateSnapshot(sessionId: string): Promise<StateSnapshot> {
|
|
44
|
-
const recentEvents = this.observer.drainEvents();
|
|
45
|
-
|
|
46
|
-
let appContext: AppContext | null = null;
|
|
47
|
-
try {
|
|
48
|
-
appContext = await this.adapter.getAppContext(sessionId);
|
|
49
|
-
} catch {
|
|
50
|
-
// May not have an active session
|
|
51
|
-
}
|
|
52
|
-
|
|
53
|
-
return {
|
|
54
|
-
recentEvents,
|
|
55
|
-
appContext,
|
|
56
|
-
lastActionResult: this.lastActionResults.get(sessionId) ?? null,
|
|
57
|
-
observing: this.observer.isObserving,
|
|
58
|
-
timestamp: new Date().toISOString(),
|
|
59
|
-
};
|
|
60
|
-
}
|
|
61
|
-
|
|
62
|
-
/** Record the result of the last action for a session. */
|
|
63
|
-
recordActionResult(sessionId: string, result: unknown): void {
|
|
64
|
-
this.lastActionResults.set(sessionId, result);
|
|
65
|
-
}
|
|
66
|
-
|
|
67
|
-
/** Start observing a process for state changes. */
|
|
68
|
-
async startObserving(sessionId: string, pid: number): Promise<void> {
|
|
69
|
-
await this.observer.startObserving(pid);
|
|
70
|
-
}
|
|
71
|
-
|
|
72
|
-
/** Stop observing a process. */
|
|
73
|
-
async stopObserving(sessionId: string, pid: number): Promise<void> {
|
|
74
|
-
await this.observer.stopObserving(pid);
|
|
75
|
-
}
|
|
76
|
-
|
|
77
|
-
/** Peek at recent events without draining. */
|
|
78
|
-
peekEvents(limit = 50): UIEvent[] {
|
|
79
|
-
return this.observer.peekEvents(limit);
|
|
80
|
-
}
|
|
81
|
-
}
|
package/src/runtime/service.ts
DELETED
|
@@ -1,448 +0,0 @@
|
|
|
1
|
-
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
-
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
-
//
|
|
4
|
-
// This file is part of ScreenHand.
|
|
5
|
-
//
|
|
6
|
-
// ScreenHand is free software: you can redistribute it and/or modify
|
|
7
|
-
// it under the terms of the GNU Affero General Public License as
|
|
8
|
-
// published by the Free Software Foundation, version 3.
|
|
9
|
-
//
|
|
10
|
-
// ScreenHand is distributed in the hope that it will be useful,
|
|
11
|
-
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12
|
-
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13
|
-
// GNU Affero General Public License for more details.
|
|
14
|
-
//
|
|
15
|
-
// You should have received a copy of the GNU Affero General Public License
|
|
16
|
-
// along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
|
|
17
|
-
|
|
18
|
-
import {
|
|
19
|
-
DEFAULT_NAVIGATE_TIMEOUT_MS,
|
|
20
|
-
DEFAULT_PROFILE,
|
|
21
|
-
DEFAULT_WAIT_TIMEOUT_MS,
|
|
22
|
-
} from "../config.js";
|
|
23
|
-
import type { TimelineLogger } from "../logging/timeline-logger.js";
|
|
24
|
-
import type {
|
|
25
|
-
AXNode,
|
|
26
|
-
AppContext,
|
|
27
|
-
AppFocusInput,
|
|
28
|
-
AppLaunchInput,
|
|
29
|
-
DragInput,
|
|
30
|
-
ElementTreeInput,
|
|
31
|
-
ExtractInput,
|
|
32
|
-
KeyComboInput,
|
|
33
|
-
MenuClickInput,
|
|
34
|
-
NavigateInput,
|
|
35
|
-
ObserveStartInput,
|
|
36
|
-
ObserveStopInput,
|
|
37
|
-
PageMeta,
|
|
38
|
-
PressInput,
|
|
39
|
-
RunningApp,
|
|
40
|
-
ScreenshotInput,
|
|
41
|
-
ScrollInput,
|
|
42
|
-
SessionInfo,
|
|
43
|
-
ToolResult,
|
|
44
|
-
TypeIntoInput,
|
|
45
|
-
WaitForInput,
|
|
46
|
-
WindowInfo,
|
|
47
|
-
} from "../types.js";
|
|
48
|
-
import type { AppAdapter } from "./app-adapter.js";
|
|
49
|
-
import { Executor } from "./executor.js";
|
|
50
|
-
import { LocatorCache } from "./locator-cache.js";
|
|
51
|
-
import { SessionManager } from "./session-manager.js";
|
|
52
|
-
|
|
53
|
-
export class AutomationRuntimeService {
|
|
54
|
-
private readonly sessions: SessionManager;
|
|
55
|
-
private readonly executor: Executor;
|
|
56
|
-
|
|
57
|
-
constructor(
|
|
58
|
-
private readonly adapter: AppAdapter,
|
|
59
|
-
private readonly logger: TimelineLogger,
|
|
60
|
-
cache = new LocatorCache(),
|
|
61
|
-
) {
|
|
62
|
-
this.sessions = new SessionManager(adapter);
|
|
63
|
-
this.executor = new Executor(adapter, cache, logger);
|
|
64
|
-
}
|
|
65
|
-
|
|
66
|
-
async sessionStart(profile = DEFAULT_PROFILE): Promise<SessionInfo> {
|
|
67
|
-
return this.sessions.sessionStart(profile);
|
|
68
|
-
}
|
|
69
|
-
|
|
70
|
-
async navigate(input: NavigateInput): Promise<ToolResult<PageMeta>> {
|
|
71
|
-
const telemetry = this.logger.start("navigate", input.sessionId);
|
|
72
|
-
try {
|
|
73
|
-
this.sessions.requireSession(input.sessionId);
|
|
74
|
-
const page = await this.adapter.navigate(
|
|
75
|
-
input.sessionId,
|
|
76
|
-
input.url,
|
|
77
|
-
input.timeoutMs ?? DEFAULT_NAVIGATE_TIMEOUT_MS,
|
|
78
|
-
);
|
|
79
|
-
return {
|
|
80
|
-
ok: true,
|
|
81
|
-
data: page,
|
|
82
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
83
|
-
};
|
|
84
|
-
} catch (error) {
|
|
85
|
-
return {
|
|
86
|
-
ok: false,
|
|
87
|
-
error: {
|
|
88
|
-
code: "ACTION_FAILED",
|
|
89
|
-
message: error instanceof Error ? error.message : "Navigate failed",
|
|
90
|
-
},
|
|
91
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
92
|
-
};
|
|
93
|
-
}
|
|
94
|
-
}
|
|
95
|
-
|
|
96
|
-
async waitFor(input: WaitForInput): Promise<ToolResult<{ matched: boolean }>> {
|
|
97
|
-
const telemetry = this.logger.start("wait_for", input.sessionId);
|
|
98
|
-
try {
|
|
99
|
-
this.sessions.requireSession(input.sessionId);
|
|
100
|
-
const matched = await this.adapter.waitFor(
|
|
101
|
-
input.sessionId,
|
|
102
|
-
input.condition,
|
|
103
|
-
input.timeoutMs ?? DEFAULT_WAIT_TIMEOUT_MS,
|
|
104
|
-
);
|
|
105
|
-
return {
|
|
106
|
-
ok: true,
|
|
107
|
-
data: { matched },
|
|
108
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
109
|
-
};
|
|
110
|
-
} catch (error) {
|
|
111
|
-
return {
|
|
112
|
-
ok: false,
|
|
113
|
-
error: {
|
|
114
|
-
code: "ACTION_FAILED",
|
|
115
|
-
message: error instanceof Error ? error.message : "Wait failed",
|
|
116
|
-
},
|
|
117
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
118
|
-
};
|
|
119
|
-
}
|
|
120
|
-
}
|
|
121
|
-
|
|
122
|
-
async press(input: PressInput): Promise<ToolResult<PageMeta>> {
|
|
123
|
-
this.sessions.requireSession(input.sessionId);
|
|
124
|
-
return this.executor.press(input);
|
|
125
|
-
}
|
|
126
|
-
|
|
127
|
-
async typeInto(input: TypeIntoInput): Promise<ToolResult<PageMeta>> {
|
|
128
|
-
this.sessions.requireSession(input.sessionId);
|
|
129
|
-
return this.executor.typeInto(input);
|
|
130
|
-
}
|
|
131
|
-
|
|
132
|
-
async extract(input: ExtractInput): Promise<ToolResult<unknown>> {
|
|
133
|
-
const telemetry = this.logger.start("extract", input.sessionId);
|
|
134
|
-
try {
|
|
135
|
-
this.sessions.requireSession(input.sessionId);
|
|
136
|
-
const data = await this.adapter.extract(
|
|
137
|
-
input.sessionId,
|
|
138
|
-
input.target,
|
|
139
|
-
input.format,
|
|
140
|
-
);
|
|
141
|
-
return {
|
|
142
|
-
ok: true,
|
|
143
|
-
data,
|
|
144
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
145
|
-
};
|
|
146
|
-
} catch (error) {
|
|
147
|
-
return {
|
|
148
|
-
ok: false,
|
|
149
|
-
error: {
|
|
150
|
-
code: "ACTION_FAILED",
|
|
151
|
-
message: error instanceof Error ? error.message : "Extract failed",
|
|
152
|
-
},
|
|
153
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
154
|
-
};
|
|
155
|
-
}
|
|
156
|
-
}
|
|
157
|
-
|
|
158
|
-
async screenshot(input: ScreenshotInput): Promise<ToolResult<{ path: string }>> {
|
|
159
|
-
const telemetry = this.logger.start("screenshot", input.sessionId);
|
|
160
|
-
try {
|
|
161
|
-
this.sessions.requireSession(input.sessionId);
|
|
162
|
-
const path = await this.adapter.screenshot(input.sessionId, input.region);
|
|
163
|
-
return {
|
|
164
|
-
ok: true,
|
|
165
|
-
data: { path },
|
|
166
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
167
|
-
};
|
|
168
|
-
} catch (error) {
|
|
169
|
-
return {
|
|
170
|
-
ok: false,
|
|
171
|
-
error: {
|
|
172
|
-
code: "ACTION_FAILED",
|
|
173
|
-
message: error instanceof Error ? error.message : "Screenshot failed",
|
|
174
|
-
},
|
|
175
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
176
|
-
};
|
|
177
|
-
}
|
|
178
|
-
}
|
|
179
|
-
|
|
180
|
-
// ── Desktop-specific methods ──
|
|
181
|
-
|
|
182
|
-
async appLaunch(input: AppLaunchInput): Promise<ToolResult<AppContext>> {
|
|
183
|
-
const telemetry = this.logger.start("app_launch", input.sessionId);
|
|
184
|
-
try {
|
|
185
|
-
this.sessions.requireSession(input.sessionId);
|
|
186
|
-
if (!this.adapter.launchApp) {
|
|
187
|
-
throw new Error("Adapter does not support launchApp");
|
|
188
|
-
}
|
|
189
|
-
const ctx = await this.adapter.launchApp(input.sessionId, input.bundleId);
|
|
190
|
-
return {
|
|
191
|
-
ok: true,
|
|
192
|
-
data: ctx,
|
|
193
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
194
|
-
};
|
|
195
|
-
} catch (error) {
|
|
196
|
-
return {
|
|
197
|
-
ok: false,
|
|
198
|
-
error: {
|
|
199
|
-
code: "ACTION_FAILED",
|
|
200
|
-
message: error instanceof Error ? error.message : "App launch failed",
|
|
201
|
-
},
|
|
202
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
203
|
-
};
|
|
204
|
-
}
|
|
205
|
-
}
|
|
206
|
-
|
|
207
|
-
async appFocus(input: AppFocusInput): Promise<ToolResult<void>> {
|
|
208
|
-
const telemetry = this.logger.start("app_focus", input.sessionId);
|
|
209
|
-
try {
|
|
210
|
-
this.sessions.requireSession(input.sessionId);
|
|
211
|
-
if (!this.adapter.focusApp) {
|
|
212
|
-
throw new Error("Adapter does not support focusApp");
|
|
213
|
-
}
|
|
214
|
-
await this.adapter.focusApp(input.sessionId, input.bundleId);
|
|
215
|
-
return {
|
|
216
|
-
ok: true,
|
|
217
|
-
data: undefined,
|
|
218
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
219
|
-
};
|
|
220
|
-
} catch (error) {
|
|
221
|
-
return {
|
|
222
|
-
ok: false,
|
|
223
|
-
error: {
|
|
224
|
-
code: "ACTION_FAILED",
|
|
225
|
-
message: error instanceof Error ? error.message : "App focus failed",
|
|
226
|
-
},
|
|
227
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
228
|
-
};
|
|
229
|
-
}
|
|
230
|
-
}
|
|
231
|
-
|
|
232
|
-
async appList(sessionId: string): Promise<ToolResult<RunningApp[]>> {
|
|
233
|
-
const telemetry = this.logger.start("app_list", sessionId);
|
|
234
|
-
try {
|
|
235
|
-
this.sessions.requireSession(sessionId);
|
|
236
|
-
if (!this.adapter.listApps) {
|
|
237
|
-
throw new Error("Adapter does not support listApps");
|
|
238
|
-
}
|
|
239
|
-
const apps = await this.adapter.listApps(sessionId);
|
|
240
|
-
return {
|
|
241
|
-
ok: true,
|
|
242
|
-
data: apps,
|
|
243
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
244
|
-
};
|
|
245
|
-
} catch (error) {
|
|
246
|
-
return {
|
|
247
|
-
ok: false,
|
|
248
|
-
error: {
|
|
249
|
-
code: "ACTION_FAILED",
|
|
250
|
-
message: error instanceof Error ? error.message : "App list failed",
|
|
251
|
-
},
|
|
252
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
253
|
-
};
|
|
254
|
-
}
|
|
255
|
-
}
|
|
256
|
-
|
|
257
|
-
async windowList(sessionId: string): Promise<ToolResult<WindowInfo[]>> {
|
|
258
|
-
const telemetry = this.logger.start("window_list", sessionId);
|
|
259
|
-
try {
|
|
260
|
-
this.sessions.requireSession(sessionId);
|
|
261
|
-
if (!this.adapter.listWindows) {
|
|
262
|
-
throw new Error("Adapter does not support listWindows");
|
|
263
|
-
}
|
|
264
|
-
const windows = await this.adapter.listWindows(sessionId);
|
|
265
|
-
return {
|
|
266
|
-
ok: true,
|
|
267
|
-
data: windows,
|
|
268
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
269
|
-
};
|
|
270
|
-
} catch (error) {
|
|
271
|
-
return {
|
|
272
|
-
ok: false,
|
|
273
|
-
error: {
|
|
274
|
-
code: "ACTION_FAILED",
|
|
275
|
-
message: error instanceof Error ? error.message : "Window list failed",
|
|
276
|
-
},
|
|
277
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
278
|
-
};
|
|
279
|
-
}
|
|
280
|
-
}
|
|
281
|
-
|
|
282
|
-
async menuClick(input: MenuClickInput): Promise<ToolResult<void>> {
|
|
283
|
-
const telemetry = this.logger.start("menu_click", input.sessionId);
|
|
284
|
-
try {
|
|
285
|
-
this.sessions.requireSession(input.sessionId);
|
|
286
|
-
if (!this.adapter.menuClick) {
|
|
287
|
-
throw new Error("Adapter does not support menuClick");
|
|
288
|
-
}
|
|
289
|
-
await this.adapter.menuClick(input.sessionId, input.menuPath);
|
|
290
|
-
return {
|
|
291
|
-
ok: true,
|
|
292
|
-
data: undefined,
|
|
293
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
294
|
-
};
|
|
295
|
-
} catch (error) {
|
|
296
|
-
return {
|
|
297
|
-
ok: false,
|
|
298
|
-
error: {
|
|
299
|
-
code: "ACTION_FAILED",
|
|
300
|
-
message: error instanceof Error ? error.message : "Menu click failed",
|
|
301
|
-
},
|
|
302
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
303
|
-
};
|
|
304
|
-
}
|
|
305
|
-
}
|
|
306
|
-
|
|
307
|
-
async keyCombo(input: KeyComboInput): Promise<ToolResult<void>> {
|
|
308
|
-
const telemetry = this.logger.start("key_combo", input.sessionId);
|
|
309
|
-
try {
|
|
310
|
-
this.sessions.requireSession(input.sessionId);
|
|
311
|
-
if (!this.adapter.keyCombo) {
|
|
312
|
-
throw new Error("Adapter does not support keyCombo");
|
|
313
|
-
}
|
|
314
|
-
await this.adapter.keyCombo(input.sessionId, input.keys);
|
|
315
|
-
return {
|
|
316
|
-
ok: true,
|
|
317
|
-
data: undefined,
|
|
318
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
319
|
-
};
|
|
320
|
-
} catch (error) {
|
|
321
|
-
return {
|
|
322
|
-
ok: false,
|
|
323
|
-
error: {
|
|
324
|
-
code: "ACTION_FAILED",
|
|
325
|
-
message: error instanceof Error ? error.message : "Key combo failed",
|
|
326
|
-
},
|
|
327
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
328
|
-
};
|
|
329
|
-
}
|
|
330
|
-
}
|
|
331
|
-
|
|
332
|
-
async elementTree(input: ElementTreeInput): Promise<ToolResult<AXNode>> {
|
|
333
|
-
const telemetry = this.logger.start("element_tree", input.sessionId);
|
|
334
|
-
try {
|
|
335
|
-
this.sessions.requireSession(input.sessionId);
|
|
336
|
-
if (!this.adapter.elementTree) {
|
|
337
|
-
throw new Error("Adapter does not support elementTree");
|
|
338
|
-
}
|
|
339
|
-
const tree = await this.adapter.elementTree(
|
|
340
|
-
input.sessionId,
|
|
341
|
-
input.maxDepth,
|
|
342
|
-
input.root,
|
|
343
|
-
);
|
|
344
|
-
return {
|
|
345
|
-
ok: true,
|
|
346
|
-
data: tree,
|
|
347
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
348
|
-
};
|
|
349
|
-
} catch (error) {
|
|
350
|
-
return {
|
|
351
|
-
ok: false,
|
|
352
|
-
error: {
|
|
353
|
-
code: "ACTION_FAILED",
|
|
354
|
-
message: error instanceof Error ? error.message : "Element tree failed",
|
|
355
|
-
},
|
|
356
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
357
|
-
};
|
|
358
|
-
}
|
|
359
|
-
}
|
|
360
|
-
|
|
361
|
-
async drag(input: DragInput): Promise<ToolResult<void>> {
|
|
362
|
-
const telemetry = this.logger.start("drag", input.sessionId);
|
|
363
|
-
try {
|
|
364
|
-
this.sessions.requireSession(input.sessionId);
|
|
365
|
-
if (!this.adapter.drag) {
|
|
366
|
-
throw new Error("Adapter does not support drag");
|
|
367
|
-
}
|
|
368
|
-
const fromEl = await this.adapter.locate(input.sessionId, input.from, 800);
|
|
369
|
-
const toEl = await this.adapter.locate(input.sessionId, input.to, 800);
|
|
370
|
-
if (!fromEl || !toEl) {
|
|
371
|
-
throw new Error("Could not locate drag source or destination");
|
|
372
|
-
}
|
|
373
|
-
await this.adapter.drag(input.sessionId, fromEl, toEl);
|
|
374
|
-
return {
|
|
375
|
-
ok: true,
|
|
376
|
-
data: undefined,
|
|
377
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
378
|
-
};
|
|
379
|
-
} catch (error) {
|
|
380
|
-
return {
|
|
381
|
-
ok: false,
|
|
382
|
-
error: {
|
|
383
|
-
code: "ACTION_FAILED",
|
|
384
|
-
message: error instanceof Error ? error.message : "Drag failed",
|
|
385
|
-
},
|
|
386
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
387
|
-
};
|
|
388
|
-
}
|
|
389
|
-
}
|
|
390
|
-
|
|
391
|
-
async scroll(input: ScrollInput): Promise<ToolResult<void>> {
|
|
392
|
-
const telemetry = this.logger.start("scroll", input.sessionId);
|
|
393
|
-
try {
|
|
394
|
-
this.sessions.requireSession(input.sessionId);
|
|
395
|
-
if (!this.adapter.scroll) {
|
|
396
|
-
throw new Error("Adapter does not support scroll");
|
|
397
|
-
}
|
|
398
|
-
let element: import("../types.js").LocatedElement | undefined;
|
|
399
|
-
if (input.target) {
|
|
400
|
-
const found = await this.adapter.locate(input.sessionId, input.target, 800);
|
|
401
|
-
if (found) element = found;
|
|
402
|
-
}
|
|
403
|
-
await this.adapter.scroll(
|
|
404
|
-
input.sessionId,
|
|
405
|
-
input.direction,
|
|
406
|
-
input.amount ?? 3,
|
|
407
|
-
element,
|
|
408
|
-
);
|
|
409
|
-
return {
|
|
410
|
-
ok: true,
|
|
411
|
-
data: undefined,
|
|
412
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
413
|
-
};
|
|
414
|
-
} catch (error) {
|
|
415
|
-
return {
|
|
416
|
-
ok: false,
|
|
417
|
-
error: {
|
|
418
|
-
code: "ACTION_FAILED",
|
|
419
|
-
message: error instanceof Error ? error.message : "Scroll failed",
|
|
420
|
-
},
|
|
421
|
-
telemetry: this.logger.finish(telemetry, "failed"),
|
|
422
|
-
};
|
|
423
|
-
}
|
|
424
|
-
}
|
|
425
|
-
|
|
426
|
-
async observeStart(_input: ObserveStartInput): Promise<ToolResult<void>> {
|
|
427
|
-
const telemetry = this.logger.start("observe_start", _input.sessionId);
|
|
428
|
-
// Implemented in Phase 4 when StateObserver is available
|
|
429
|
-
return {
|
|
430
|
-
ok: true,
|
|
431
|
-
data: undefined,
|
|
432
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
433
|
-
};
|
|
434
|
-
}
|
|
435
|
-
|
|
436
|
-
async observeStop(_input: ObserveStopInput): Promise<ToolResult<void>> {
|
|
437
|
-
const telemetry = this.logger.start("observe_stop", _input.sessionId);
|
|
438
|
-
return {
|
|
439
|
-
ok: true,
|
|
440
|
-
data: undefined,
|
|
441
|
-
telemetry: this.logger.finish(telemetry, "success"),
|
|
442
|
-
};
|
|
443
|
-
}
|
|
444
|
-
|
|
445
|
-
getTimeline(limit = 100) {
|
|
446
|
-
return this.logger.getRecent(limit);
|
|
447
|
-
}
|
|
448
|
-
}
|
|
@@ -1,50 +0,0 @@
|
|
|
1
|
-
// Copyright (C) 2025 Clazro Technology Private Limited
|
|
2
|
-
// SPDX-License-Identifier: AGPL-3.0-only
|
|
3
|
-
//
|
|
4
|
-
// This file is part of ScreenHand.
|
|
5
|
-
//
|
|
6
|
-
// ScreenHand is free software: you can redistribute it and/or modify
|
|
7
|
-
// it under the terms of the GNU Affero General Public License as
|
|
8
|
-
// published by the Free Software Foundation, version 3.
|
|
9
|
-
//
|
|
10
|
-
// ScreenHand is distributed in the hope that it will be useful,
|
|
11
|
-
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12
|
-
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13
|
-
// GNU Affero General Public License for more details.
|
|
14
|
-
//
|
|
15
|
-
// You should have received a copy of the GNU Affero General Public License
|
|
16
|
-
// along with ScreenHand. If not, see <https://www.gnu.org/licenses/>.
|
|
17
|
-
|
|
18
|
-
import type { AppAdapter } from "./app-adapter.js";
|
|
19
|
-
import type { SessionInfo } from "../types.js";
|
|
20
|
-
|
|
21
|
-
export class SessionManager {
|
|
22
|
-
private readonly sessionsByProfile = new Map<string, SessionInfo>();
|
|
23
|
-
private readonly sessionsById = new Map<string, SessionInfo>();
|
|
24
|
-
|
|
25
|
-
constructor(private readonly adapter: AppAdapter) {}
|
|
26
|
-
|
|
27
|
-
async sessionStart(profile: string): Promise<SessionInfo> {
|
|
28
|
-
const existing = this.sessionsByProfile.get(profile);
|
|
29
|
-
if (existing) {
|
|
30
|
-
return existing;
|
|
31
|
-
}
|
|
32
|
-
|
|
33
|
-
const created = await this.adapter.attach(profile);
|
|
34
|
-
this.sessionsByProfile.set(profile, created);
|
|
35
|
-
this.sessionsById.set(created.sessionId, created);
|
|
36
|
-
return created;
|
|
37
|
-
}
|
|
38
|
-
|
|
39
|
-
getSession(sessionId: string): SessionInfo | undefined {
|
|
40
|
-
return this.sessionsById.get(sessionId);
|
|
41
|
-
}
|
|
42
|
-
|
|
43
|
-
requireSession(sessionId: string): SessionInfo {
|
|
44
|
-
const session = this.getSession(sessionId);
|
|
45
|
-
if (!session) {
|
|
46
|
-
throw new Error(`Session not found: ${sessionId}`);
|
|
47
|
-
}
|
|
48
|
-
return session;
|
|
49
|
-
}
|
|
50
|
-
}
|