@praveencs/agent 0.9.30 → 0.10.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +55 -9
- package/ROADMAP.md +42 -50
- package/agent-skills/README.md +192 -0
- package/agent-skills/plugins/aws/plugin.json +22 -0
- package/agent-skills/plugins/aws/skills/aws-manager.md +17 -0
- package/agent-skills/plugins/aws/tools/aws.js +152 -0
- package/agent-skills/plugins/discord/plugin.json +22 -0
- package/agent-skills/plugins/discord/skills/discord-manager.md +15 -0
- package/agent-skills/plugins/discord/tools/discord.js +150 -0
- package/agent-skills/plugins/docker/plugin.json +21 -0
- package/agent-skills/plugins/docker/skills/docker-manager.md +15 -0
- package/agent-skills/plugins/docker/tools/docker.js +135 -0
- package/agent-skills/plugins/firebase/plugin.json +22 -0
- package/agent-skills/plugins/firebase/skills/firebase-manager.md +14 -0
- package/agent-skills/plugins/firebase/tools/firebase.js +157 -0
- package/agent-skills/plugins/github/plugin.json +23 -0
- package/agent-skills/plugins/github/skills/github-manager.md +15 -0
- package/agent-skills/plugins/github/tools/github.js +133 -0
- package/agent-skills/plugins/huggingface/plugin.json +22 -0
- package/agent-skills/plugins/huggingface/skills/huggingface-manager.md +16 -0
- package/agent-skills/plugins/huggingface/tools/huggingface.js +149 -0
- package/agent-skills/plugins/linear/plugin.json +22 -0
- package/agent-skills/plugins/linear/skills/linear-manager.md +16 -0
- package/agent-skills/plugins/linear/tools/linear.js +199 -0
- package/agent-skills/plugins/mongodb/plugin.json +21 -0
- package/agent-skills/plugins/mongodb/skills/mongodb-manager.md +14 -0
- package/agent-skills/plugins/mongodb/tools/mongodb.js +123 -0
- package/agent-skills/plugins/notion/plugin.json +22 -0
- package/agent-skills/plugins/notion/skills/notion-manager.md +16 -0
- package/agent-skills/plugins/notion/tools/notion.js +158 -0
- package/agent-skills/plugins/openai/plugin.json +23 -0
- package/agent-skills/plugins/openai/skills/openai-manager.md +15 -0
- package/agent-skills/plugins/openai/tools/openai.js +137 -0
- package/agent-skills/plugins/resend/plugin.json +21 -0
- package/agent-skills/plugins/resend/skills/resend-manager.md +15 -0
- package/agent-skills/plugins/resend/tools/resend.js +102 -0
- package/agent-skills/plugins/slack/plugin.json +22 -0
- package/agent-skills/plugins/slack/skills/slack-manager.md +15 -0
- package/agent-skills/plugins/slack/tools/slack.js +168 -0
- package/agent-skills/plugins/stripe/plugin.json +22 -0
- package/agent-skills/plugins/stripe/skills/stripe-manager.md +16 -0
- package/agent-skills/plugins/stripe/tools/stripe.js +174 -0
- package/agent-skills/plugins/supabase/plugin.json +22 -0
- package/agent-skills/plugins/supabase/skills/supabase-manager.md +16 -0
- package/agent-skills/plugins/supabase/tools/supabase.js +153 -0
- package/agent-skills/plugins/telegram/plugin.json +21 -0
- package/agent-skills/plugins/telegram/skills/telegram-manager.md +14 -0
- package/agent-skills/plugins/telegram/tools/telegram.js +131 -0
- package/agent-skills/plugins/vercel/plugin.json +22 -0
- package/agent-skills/plugins/vercel/skills/vercel-manager.md +15 -0
- package/agent-skills/plugins/vercel/tools/vercel.js +145 -0
- package/agent-skills/registry.json +675 -0
- package/agent-skills/skills/api-tester/prompt.md +27 -0
- package/agent-skills/skills/api-tester/skill.json +16 -0
- package/agent-skills/skills/backup/prompt.md +12 -0
- package/agent-skills/skills/backup/skill.json +1 -0
- package/agent-skills/skills/code-review/prompt.md +29 -0
- package/agent-skills/skills/code-review/skill.json +18 -0
- package/agent-skills/skills/create-note/prompt.md +21 -0
- package/agent-skills/skills/create-note/skill.json +15 -0
- package/agent-skills/skills/cron-scheduler/prompt.md +25 -0
- package/agent-skills/skills/cron-scheduler/skill.json +1 -0
- package/agent-skills/skills/db-query/prompt.md +12 -0
- package/agent-skills/skills/db-query/skill.json +1 -0
- package/agent-skills/skills/docker-deploy/prompt.md +21 -0
- package/agent-skills/skills/docker-deploy/skill.json +16 -0
- package/agent-skills/skills/file-organizer/prompt.md +32 -0
- package/agent-skills/skills/file-organizer/skill.json +19 -0
- package/agent-skills/skills/git-commit/prompt.md +21 -0
- package/agent-skills/skills/git-commit/skill.json +17 -0
- package/agent-skills/skills/log-analyzer/prompt.md +16 -0
- package/agent-skills/skills/log-analyzer/skill.json +1 -0
- package/agent-skills/skills/npm-publish/prompt.md +24 -0
- package/agent-skills/skills/npm-publish/skill.json +20 -0
- package/agent-skills/skills/open-vscode/prompt.md +8 -0
- package/agent-skills/skills/open-vscode/skill.json +15 -0
- package/agent-skills/skills/project-scaffold/prompt.md +43 -0
- package/agent-skills/skills/project-scaffold/skill.json +17 -0
- package/agent-skills/skills/send-email/prompt.md +19 -0
- package/agent-skills/skills/send-email/send.js +60 -0
- package/agent-skills/skills/send-email/skill.json +16 -0
- package/agent-skills/skills/system-monitor/prompt.md +27 -0
- package/agent-skills/skills/system-monitor/skill.json +15 -0
- package/agent-skills/skills/web-search/prompt.md +26 -0
- package/agent-skills/skills/web-search/skill.json +16 -0
- package/dist/src/cli/commands/desktop.d.ts +3 -0
- package/dist/src/cli/commands/desktop.d.ts.map +1 -0
- package/dist/src/cli/commands/desktop.js +80 -0
- package/dist/src/cli/commands/desktop.js.map +1 -0
- package/dist/src/cli/commands/multimodal.d.ts +3 -0
- package/dist/src/cli/commands/multimodal.d.ts.map +1 -0
- package/dist/src/cli/commands/multimodal.js +78 -0
- package/dist/src/cli/commands/multimodal.js.map +1 -0
- package/dist/src/cli/commands/sandbox.d.ts +3 -0
- package/dist/src/cli/commands/sandbox.d.ts.map +1 -0
- package/dist/src/cli/commands/sandbox.js +89 -0
- package/dist/src/cli/commands/sandbox.js.map +1 -0
- package/dist/src/cli/commands/swarm.d.ts +3 -0
- package/dist/src/cli/commands/swarm.d.ts.map +1 -0
- package/dist/src/cli/commands/swarm.js +120 -0
- package/dist/src/cli/commands/swarm.js.map +1 -0
- package/dist/src/cli/index.d.ts.map +1 -1
- package/dist/src/cli/index.js +8 -0
- package/dist/src/cli/index.js.map +1 -1
- package/dist/src/config/defaults.d.ts.map +1 -1
- package/dist/src/config/defaults.js +42 -0
- package/dist/src/config/defaults.js.map +1 -1
- package/dist/src/config/schema.d.ts +261 -0
- package/dist/src/config/schema.d.ts.map +1 -1
- package/dist/src/config/schema.js +58 -0
- package/dist/src/config/schema.js.map +1 -1
- package/dist/src/desktop/engine.d.ts +42 -0
- package/dist/src/desktop/engine.d.ts.map +1 -0
- package/dist/src/desktop/engine.js +77 -0
- package/dist/src/desktop/engine.js.map +1 -0
- package/dist/src/desktop/index.d.ts +6 -0
- package/dist/src/desktop/index.d.ts.map +1 -0
- package/dist/src/desktop/index.js +6 -0
- package/dist/src/desktop/index.js.map +1 -0
- package/dist/src/desktop/input.d.ts +20 -0
- package/dist/src/desktop/input.d.ts.map +1 -0
- package/dist/src/desktop/input.js +160 -0
- package/dist/src/desktop/input.js.map +1 -0
- package/dist/src/desktop/screen.d.ts +17 -0
- package/dist/src/desktop/screen.d.ts.map +1 -0
- package/dist/src/desktop/screen.js +120 -0
- package/dist/src/desktop/screen.js.map +1 -0
- package/dist/src/desktop/types.d.ts +50 -0
- package/dist/src/desktop/types.d.ts.map +1 -0
- package/dist/src/desktop/types.js +10 -0
- package/dist/src/desktop/types.js.map +1 -0
- package/dist/src/multimodal/engine.d.ts +33 -0
- package/dist/src/multimodal/engine.d.ts.map +1 -0
- package/dist/src/multimodal/engine.js +63 -0
- package/dist/src/multimodal/engine.js.map +1 -0
- package/dist/src/multimodal/index.d.ts +7 -0
- package/dist/src/multimodal/index.d.ts.map +1 -0
- package/dist/src/multimodal/index.js +7 -0
- package/dist/src/multimodal/index.js.map +1 -0
- package/dist/src/multimodal/tts.d.ts +11 -0
- package/dist/src/multimodal/tts.d.ts.map +1 -0
- package/dist/src/multimodal/tts.js +48 -0
- package/dist/src/multimodal/tts.js.map +1 -0
- package/dist/src/multimodal/types.d.ts +55 -0
- package/dist/src/multimodal/types.d.ts.map +1 -0
- package/dist/src/multimodal/types.js +20 -0
- package/dist/src/multimodal/types.js.map +1 -0
- package/dist/src/multimodal/vision.d.ts +15 -0
- package/dist/src/multimodal/vision.d.ts.map +1 -0
- package/dist/src/multimodal/vision.js +98 -0
- package/dist/src/multimodal/vision.js.map +1 -0
- package/dist/src/multimodal/voice.d.ts +11 -0
- package/dist/src/multimodal/voice.d.ts.map +1 -0
- package/dist/src/multimodal/voice.js +43 -0
- package/dist/src/multimodal/voice.js.map +1 -0
- package/dist/src/plans/types.d.ts +18 -18
- package/dist/src/sandbox/docker.d.ts +42 -0
- package/dist/src/sandbox/docker.d.ts.map +1 -0
- package/dist/src/sandbox/docker.js +131 -0
- package/dist/src/sandbox/docker.js.map +1 -0
- package/dist/src/sandbox/engine.d.ts +50 -0
- package/dist/src/sandbox/engine.d.ts.map +1 -0
- package/dist/src/sandbox/engine.js +133 -0
- package/dist/src/sandbox/engine.js.map +1 -0
- package/dist/src/sandbox/index.d.ts +5 -0
- package/dist/src/sandbox/index.d.ts.map +1 -0
- package/dist/src/sandbox/index.js +5 -0
- package/dist/src/sandbox/index.js.map +1 -0
- package/dist/src/sandbox/types.d.ts +41 -0
- package/dist/src/sandbox/types.d.ts.map +1 -0
- package/dist/src/sandbox/types.js +12 -0
- package/dist/src/sandbox/types.js.map +1 -0
- package/dist/src/scripts/types.d.ts +2 -2
- package/dist/src/server/app.d.ts.map +1 -1
- package/dist/src/server/app.js +133 -0
- package/dist/src/server/app.js.map +1 -1
- package/dist/src/swarm/bus.d.ts +27 -0
- package/dist/src/swarm/bus.d.ts.map +1 -0
- package/dist/src/swarm/bus.js +64 -0
- package/dist/src/swarm/bus.js.map +1 -0
- package/dist/src/swarm/index.d.ts +6 -0
- package/dist/src/swarm/index.d.ts.map +1 -0
- package/dist/src/swarm/index.js +6 -0
- package/dist/src/swarm/index.js.map +1 -0
- package/dist/src/swarm/orchestrator.d.ts +79 -0
- package/dist/src/swarm/orchestrator.d.ts.map +1 -0
- package/dist/src/swarm/orchestrator.js +271 -0
- package/dist/src/swarm/orchestrator.js.map +1 -0
- package/dist/src/swarm/roles.d.ts +18 -0
- package/dist/src/swarm/roles.d.ts.map +1 -0
- package/dist/src/swarm/roles.js +83 -0
- package/dist/src/swarm/roles.js.map +1 -0
- package/dist/src/swarm/types.d.ts +58 -0
- package/dist/src/swarm/types.d.ts.map +1 -0
- package/dist/src/swarm/types.js +10 -0
- package/dist/src/swarm/types.js.map +1 -0
- package/dist/src/tools/core/cmd.d.ts.map +1 -1
- package/dist/src/tools/core/cmd.js +28 -0
- package/dist/src/tools/core/cmd.js.map +1 -1
- package/docs/DOCUMENTATION.md +137 -0
- package/package.json +3 -1
- package/studio/README.md +73 -0
- package/studio/eslint.config.js +23 -0
- package/studio/index.html +13 -0
- package/studio/package-lock.json +4350 -0
- package/studio/package.json +44 -0
- package/studio/postcss.config.js +6 -0
- package/studio/public/vite.svg +1 -0
- package/studio/src/App.tsx +243 -0
- package/studio/src/assets/react.svg +1 -0
- package/studio/src/components/Capabilities.tsx +80 -0
- package/studio/src/components/CommandsManager.tsx +94 -0
- package/studio/src/components/CostDashboard.tsx +182 -0
- package/studio/src/components/CredentialCapture.tsx +196 -0
- package/studio/src/components/CredentialsManager.tsx +257 -0
- package/studio/src/components/DaemonPanel.tsx +91 -0
- package/studio/src/components/DesktopPanel.tsx +118 -0
- package/studio/src/components/GoalTemplates.tsx +190 -0
- package/studio/src/components/GoalsPanel.tsx +235 -0
- package/studio/src/components/MemoryExplorer.tsx +152 -0
- package/studio/src/components/MultimodalPanel.tsx +150 -0
- package/studio/src/components/NotificationsPanel.tsx +175 -0
- package/studio/src/components/PluginsManager.tsx +60 -0
- package/studio/src/components/SandboxPanel.tsx +118 -0
- package/studio/src/components/ScriptsManager.tsx +269 -0
- package/studio/src/components/SkillsManager.tsx +123 -0
- package/studio/src/components/SwarmPanel.tsx +149 -0
- package/studio/src/components/TaskStreaming.tsx +189 -0
- package/studio/src/components/Terminal.tsx +200 -0
- package/studio/src/index.css +51 -0
- package/studio/src/main.tsx +13 -0
- package/studio/tailwind.config.js +47 -0
- package/studio/tsconfig.app.json +28 -0
- package/studio/tsconfig.json +7 -0
- package/studio/tsconfig.node.json +26 -0
- package/studio/vite.config.ts +7 -0
|
@@ -0,0 +1,160 @@
|
|
|
1
|
+
// ─── Input Controller ───
|
|
2
|
+
// Simulates mouse and keyboard input using platform-native CLI tools.
|
|
3
|
+
import { execFile } from 'node:child_process';
|
|
4
|
+
import { promisify } from 'node:util';
|
|
5
|
+
const execFileAsync = promisify(execFile);
|
|
6
|
+
export class InputController {
|
|
7
|
+
delay;
|
|
8
|
+
constructor(actionDelay = 100) {
|
|
9
|
+
this.delay = actionDelay;
|
|
10
|
+
}
|
|
11
|
+
/**
|
|
12
|
+
* Execute a mouse action.
|
|
13
|
+
*/
|
|
14
|
+
async mouse(action) {
|
|
15
|
+
const platform = process.platform;
|
|
16
|
+
try {
|
|
17
|
+
if (platform === 'linux') {
|
|
18
|
+
await this.mouseLinux(action);
|
|
19
|
+
}
|
|
20
|
+
else if (platform === 'darwin') {
|
|
21
|
+
await this.mouseMac(action);
|
|
22
|
+
}
|
|
23
|
+
else {
|
|
24
|
+
throw new Error(`Mouse control not supported on ${platform} yet.`);
|
|
25
|
+
}
|
|
26
|
+
await this.sleep(this.delay);
|
|
27
|
+
return { success: true, action: `mouse.${action.type}` };
|
|
28
|
+
}
|
|
29
|
+
catch (err) {
|
|
30
|
+
return { success: false, action: `mouse.${action.type}`, error: err.message };
|
|
31
|
+
}
|
|
32
|
+
}
|
|
33
|
+
/**
|
|
34
|
+
* Execute a keyboard action.
|
|
35
|
+
*/
|
|
36
|
+
async keyboard(action) {
|
|
37
|
+
const platform = process.platform;
|
|
38
|
+
try {
|
|
39
|
+
if (platform === 'linux') {
|
|
40
|
+
await this.keyboardLinux(action);
|
|
41
|
+
}
|
|
42
|
+
else if (platform === 'darwin') {
|
|
43
|
+
await this.keyboardMac(action);
|
|
44
|
+
}
|
|
45
|
+
else {
|
|
46
|
+
throw new Error(`Keyboard control not supported on ${platform} yet.`);
|
|
47
|
+
}
|
|
48
|
+
await this.sleep(this.delay);
|
|
49
|
+
return { success: true, action: `keyboard.${action.type}` };
|
|
50
|
+
}
|
|
51
|
+
catch (err) {
|
|
52
|
+
return { success: false, action: `keyboard.${action.type}`, error: err.message };
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
// ─── Linux (xdotool) ───
|
|
56
|
+
async mouseLinux(action) {
|
|
57
|
+
switch (action.type) {
|
|
58
|
+
case 'move':
|
|
59
|
+
await execFileAsync('xdotool', ['mousemove', String(action.x || 0), String(action.y || 0)]);
|
|
60
|
+
break;
|
|
61
|
+
case 'click':
|
|
62
|
+
if (action.x !== undefined && action.y !== undefined) {
|
|
63
|
+
await execFileAsync('xdotool', ['mousemove', String(action.x), String(action.y)]);
|
|
64
|
+
}
|
|
65
|
+
await execFileAsync('xdotool', ['click', action.button === 'right' ? '3' : '1']);
|
|
66
|
+
break;
|
|
67
|
+
case 'doubleClick':
|
|
68
|
+
if (action.x !== undefined && action.y !== undefined) {
|
|
69
|
+
await execFileAsync('xdotool', ['mousemove', String(action.x), String(action.y)]);
|
|
70
|
+
}
|
|
71
|
+
await execFileAsync('xdotool', ['click', '--repeat', '2', '1']);
|
|
72
|
+
break;
|
|
73
|
+
case 'rightClick':
|
|
74
|
+
if (action.x !== undefined && action.y !== undefined) {
|
|
75
|
+
await execFileAsync('xdotool', ['mousemove', String(action.x), String(action.y)]);
|
|
76
|
+
}
|
|
77
|
+
await execFileAsync('xdotool', ['click', '3']);
|
|
78
|
+
break;
|
|
79
|
+
case 'scroll':
|
|
80
|
+
await execFileAsync('xdotool', ['click', (action.scrollAmount || 0) > 0 ? '5' : '4']);
|
|
81
|
+
break;
|
|
82
|
+
case 'drag':
|
|
83
|
+
await execFileAsync('xdotool', [
|
|
84
|
+
'mousemove', String(action.x || 0), String(action.y || 0),
|
|
85
|
+
'mousedown', '1',
|
|
86
|
+
'mousemove', String(action.toX || 0), String(action.toY || 0),
|
|
87
|
+
'mouseup', '1',
|
|
88
|
+
]);
|
|
89
|
+
break;
|
|
90
|
+
}
|
|
91
|
+
}
|
|
92
|
+
async keyboardLinux(action) {
|
|
93
|
+
switch (action.type) {
|
|
94
|
+
case 'type':
|
|
95
|
+
await execFileAsync('xdotool', ['type', '--clearmodifiers', action.text || '']);
|
|
96
|
+
break;
|
|
97
|
+
case 'press':
|
|
98
|
+
await execFileAsync('xdotool', ['key', action.key || '']);
|
|
99
|
+
break;
|
|
100
|
+
case 'hotkey': {
|
|
101
|
+
const combo = [...(action.modifiers || []), action.key || ''].join('+');
|
|
102
|
+
await execFileAsync('xdotool', ['key', combo]);
|
|
103
|
+
break;
|
|
104
|
+
}
|
|
105
|
+
}
|
|
106
|
+
}
|
|
107
|
+
// ─── macOS (osascript / cliclick) ───
|
|
108
|
+
async mouseMac(action) {
|
|
109
|
+
switch (action.type) {
|
|
110
|
+
case 'click':
|
|
111
|
+
await execFileAsync('osascript', ['-e',
|
|
112
|
+
`tell application "System Events" to click at {${action.x || 0}, ${action.y || 0}}`
|
|
113
|
+
]);
|
|
114
|
+
break;
|
|
115
|
+
case 'move':
|
|
116
|
+
// Use cliclick if available, else AppleScript
|
|
117
|
+
try {
|
|
118
|
+
await execFileAsync('cliclick', [`m:${action.x || 0},${action.y || 0}`]);
|
|
119
|
+
}
|
|
120
|
+
catch {
|
|
121
|
+
// Fallback: mouse move isn't natively easy on macOS without cliclick
|
|
122
|
+
}
|
|
123
|
+
break;
|
|
124
|
+
default:
|
|
125
|
+
throw new Error(`Mouse action ${action.type} requires cliclick on macOS`);
|
|
126
|
+
}
|
|
127
|
+
}
|
|
128
|
+
async keyboardMac(action) {
|
|
129
|
+
switch (action.type) {
|
|
130
|
+
case 'type':
|
|
131
|
+
await execFileAsync('osascript', ['-e',
|
|
132
|
+
`tell application "System Events" to keystroke "${(action.text || '').replace(/"/g, '\\"')}"`
|
|
133
|
+
]);
|
|
134
|
+
break;
|
|
135
|
+
case 'press':
|
|
136
|
+
await execFileAsync('osascript', ['-e',
|
|
137
|
+
`tell application "System Events" to key code ${this.macKeyCode(action.key || '')}`
|
|
138
|
+
]);
|
|
139
|
+
break;
|
|
140
|
+
case 'hotkey': {
|
|
141
|
+
const mods = (action.modifiers || []).map(m => m === 'ctrl' ? 'control down' : m === 'alt' ? 'option down' : m === 'meta' ? 'command down' : `${m} down`).join(', ');
|
|
142
|
+
await execFileAsync('osascript', ['-e',
|
|
143
|
+
`tell application "System Events" to keystroke "${action.key}" using {${mods}}`
|
|
144
|
+
]);
|
|
145
|
+
break;
|
|
146
|
+
}
|
|
147
|
+
}
|
|
148
|
+
}
|
|
149
|
+
macKeyCode(key) {
|
|
150
|
+
const codes = {
|
|
151
|
+
'Return': 36, 'Tab': 48, 'Escape': 53, 'Space': 49,
|
|
152
|
+
'Delete': 51, 'Up': 126, 'Down': 125, 'Left': 123, 'Right': 124,
|
|
153
|
+
};
|
|
154
|
+
return String(codes[key] || 0);
|
|
155
|
+
}
|
|
156
|
+
sleep(ms) {
|
|
157
|
+
return new Promise(resolve => setTimeout(resolve, ms));
|
|
158
|
+
}
|
|
159
|
+
}
|
|
160
|
+
//# sourceMappingURL=input.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"input.js","sourceRoot":"","sources":["../../../src/desktop/input.ts"],"names":[],"mappings":"AAAA,2BAA2B;AAC3B,sEAAsE;AAEtE,OAAO,EAAE,QAAQ,EAAE,MAAM,oBAAoB,CAAC;AAC9C,OAAO,EAAE,SAAS,EAAE,MAAM,WAAW,CAAC;AAGtC,MAAM,aAAa,GAAG,SAAS,CAAC,QAAQ,CAAC,CAAC;AAE1C,MAAM,OAAO,eAAe;IAChB,KAAK,CAAS;IAEtB,YAAY,cAAsB,GAAG;QACjC,IAAI,CAAC,KAAK,GAAG,WAAW,CAAC;IAC7B,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,KAAK,CAAC,MAAmB;QAC3B,MAAM,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QAElC,IAAI,CAAC;YACD,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;gBACvB,MAAM,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC;YAClC,CAAC;iBAAM,IAAI,QAAQ,KAAK,QAAQ,EAAE,CAAC;gBAC/B,MAAM,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAChC,CAAC;iBAAM,CAAC;gBACJ,MAAM,IAAI,KAAK,CAAC,kCAAkC,QAAQ,OAAO,CAAC,CAAC;YACvE,CAAC;YAED,MAAM,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YAC7B,OAAO,EAAE,OAAO,EAAE,IAAI,EAAE,MAAM,EAAE,SAAS,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;QAC7D,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,OAAO,EAAE,OAAO,EAAE,KAAK,EAAE,MAAM,EAAE,SAAS,MAAM,CAAC,IAAI,EAAE,EAAE,KAAK,EAAG,GAAa,CAAC,OAAO,EAAE,CAAC;QAC7F,CAAC;IACL,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,QAAQ,CAAC,MAAsB;QACjC,MAAM,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QAElC,IAAI,CAAC;YACD,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;gBACvB,MAAM,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YACrC,CAAC;iBAAM,IAAI,QAAQ,KAAK,QAAQ,EAAE,CAAC;gBAC/B,MAAM,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;YACnC,CAAC;iBAAM,CAAC;gBACJ,MAAM,IAAI,KAAK,CAAC,qCAAqC,QAAQ,OAAO,CAAC,CAAC;YAC1E,CAAC;YAED,MAAM,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YAC7B,OAAO,EAAE,OAAO,EAAE,IAAI,EAAE,MAAM,EAAE,YAAY,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;QAChE,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,OAAO,EAAE,OAAO,EAAE,KAAK,EAAE,MAAM,EAAE,YAAY,MAAM,CAAC,IAAI,EAAE,EAAE,KAAK,EAAG,GAAa,CAAC,OAAO,EAAE,CAAC;QAChG,CAAC;IACL,CAAC;IAED,0BAA0B;IAElB,KAAK,CAAC,UAAU,CAAC,MAAmB;QACxC,QAAQ,MAAM,CAAC,IAAI,EAAE,CAAC;YAClB,KAAK,MAAM;gBACP,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC;gBAC5F,MAAM;YACV,KAAK,OAAO;gBACR,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,EAAE,CAAC;oBACnD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACtF,CAAC;gBACD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,OAAO,EAAE,MAAM,CAAC,MAAM,KAAK,OAAO,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;gBACjF,MAAM;YACV,KAAK,aAAa;gBACd,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,EAAE,CAAC;oBACnD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACtF,CAAC;gBACD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,OAAO,EAAE,UAAU,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC,CAAC;gBAChE,MAAM;YACV,KAAK,YAAY;gBACb,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,IAAI,MAAM,CAAC,CAAC,KAAK,SAAS,EAAE,CAAC;oBACnD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACtF,CAAC;gBACD,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,OAAO,EAAE,GAAG,CAAC,CAAC,CAAC;gBAC/C,MAAM;YACV,KAAK,QAAQ;gBACT,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,OAAO,EAAE,CAAC,MAAM,CAAC,YAAY,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;gBACtF,MAAM;YACV,KAAK,MAAM;gBACP,MAAM,aAAa,CAAC,SAAS,EAAE;oBAC3B,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC;oBACzD,WAAW,EAAE,GAAG;oBAChB,WAAW,EAAE,MAAM,CAAC,MAAM,CAAC,GAAG,IAAI,CAAC,CAAC,EAAE,MAAM,CAAC,MAAM,CAAC,GAAG,IAAI,CAAC,CAAC;oBAC7D,SAAS,EAAE,GAAG;iBACjB,CAAC,CAAC;gBACH,MAAM;QACd,CAAC;IACL,CAAC;IAEO,KAAK,CAAC,aAAa,CAAC,MAAsB;QAC9C,QAAQ,MAAM,CAAC,IAAI,EAAE,CAAC;YAClB,KAAK,MAAM;gBACP,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,MAAM,EAAE,kBAAkB,EAAE,MAAM,CAAC,IAAI,IAAI,EAAE,CAAC,CAAC,CAAC;gBAChF,MAAM;YACV,KAAK,OAAO;gBACR,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,KAAK,EAAE,MAAM,CAAC,GAAG,IAAI,EAAE,CAAC,CAAC,CAAC;gBAC1D,MAAM;YACV,KAAK,QAAQ,CAAC,CAAC,CAAC;gBACZ,MAAM,KAAK,GAAG,CAAC,GAAG,CAAC,MAAM,CAAC,SAAS,IAAI,EAAE,CAAC,EAAE,MAAM,CAAC,GAAG,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;gBACxE,MAAM,aAAa,CAAC,SAAS,EAAE,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC,CAAC;gBAC/C,MAAM;YACV,CAAC;QACL,CAAC;IACL,CAAC;IAED,uCAAuC;IAE/B,KAAK,CAAC,QAAQ,CAAC,MAAmB;QACtC,QAAQ,MAAM,CAAC,IAAI,EAAE,CAAC;YAClB,KAAK,OAAO;gBACR,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC,IAAI;oBAClC,iDAAiD,MAAM,CAAC,CAAC,IAAI,CAAC,KAAK,MAAM,CAAC,CAAC,IAAI,CAAC,GAAG;iBACtF,CAAC,CAAC;gBACH,MAAM;YACV,KAAK,MAAM;gBACP,8CAA8C;gBAC9C,IAAI,CAAC;oBACD,MAAM,aAAa,CAAC,UAAU,EAAE,CAAC,KAAK,MAAM,CAAC,CAAC,IAAI,CAAC,IAAI,MAAM,CAAC,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC;gBAC7E,CAAC;gBAAC,MAAM,CAAC;oBACL,qEAAqE;gBACzE,CAAC;gBACD,MAAM;YACV;gBACI,MAAM,IAAI,KAAK,CAAC,gBAAgB,MAAM,CAAC,IAAI,6BAA6B,CAAC,CAAC;QAClF,CAAC;IACL,CAAC;IAEO,KAAK,CAAC,WAAW,CAAC,MAAsB;QAC5C,QAAQ,MAAM,CAAC,IAAI,EAAE,CAAC;YAClB,KAAK,MAAM;gBACP,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC,IAAI;oBAClC,kDAAkD,CAAC,MAAM,CAAC,IAAI,IAAI,EAAE,CAAC,CAAC,OAAO,CAAC,IAAI,EAAE,KAAK,CAAC,GAAG;iBAChG,CAAC,CAAC;gBACH,MAAM;YACV,KAAK,OAAO;gBACR,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC,IAAI;oBAClC,gDAAgD,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC,GAAG,IAAI,EAAE,CAAC,EAAE;iBACtF,CAAC,CAAC;gBACH,MAAM;YACV,KAAK,QAAQ,CAAC,CAAC,CAAC;gBACZ,MAAM,IAAI,GAAG,CAAC,MAAM,CAAC,SAAS,IAAI,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAC1C,CAAC,KAAK,MAAM,CAAC,CAAC,CAAC,cAAc,CAAC,CAAC,CAAC,CAAC,KAAK,KAAK,CAAC,CAAC,CAAC,aAAa,CAAC,CAAC,CAAC,CAAC,KAAK,MAAM,CAAC,CAAC,CAAC,cAAc,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAC5G,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;gBACb,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC,IAAI;oBAClC,kDAAkD,MAAM,CAAC,GAAG,YAAY,IAAI,GAAG;iBAClF,CAAC,CAAC;gBACH,MAAM;YACV,CAAC;QACL,CAAC;IACL,CAAC;IAEO,UAAU,CAAC,GAAW;QAC1B,MAAM,KAAK,GAA2B;YAClC,QAAQ,EAAE,EAAE,EAAE,KAAK,EAAE,EAAE,EAAE,QAAQ,EAAE,EAAE,EAAE,OAAO,EAAE,EAAE;YAClD,QAAQ,EAAE,EAAE,EAAE,IAAI,EAAE,GAAG,EAAE,MAAM,EAAE,GAAG,EAAE,MAAM,EAAE,GAAG,EAAE,OAAO,EAAE,GAAG;SAClE,CAAC;QACF,OAAO,MAAM,CAAC,KAAK,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,CAAC;IACnC,CAAC;IAEO,KAAK,CAAC,EAAU;QACpB,OAAO,IAAI,OAAO,CAAC,OAAO,CAAC,EAAE,CAAC,UAAU,CAAC,OAAO,EAAE,EAAE,CAAC,CAAC,CAAC;IAC3D,CAAC;CACJ"}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import type { ScreenCaptureResult, ScreenRegion } from './types.js';
|
|
2
|
+
export declare class ScreenCapture {
|
|
3
|
+
private tempDir;
|
|
4
|
+
constructor(tempDir?: string);
|
|
5
|
+
/**
|
|
6
|
+
* Capture a full screenshot or a specific region.
|
|
7
|
+
*/
|
|
8
|
+
capture(region?: ScreenRegion): Promise<ScreenCaptureResult>;
|
|
9
|
+
private captureLinux;
|
|
10
|
+
private captureMac;
|
|
11
|
+
private captureWindows;
|
|
12
|
+
/**
|
|
13
|
+
* Clean up all temporary screenshots.
|
|
14
|
+
*/
|
|
15
|
+
cleanup(): void;
|
|
16
|
+
}
|
|
17
|
+
//# sourceMappingURL=screen.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"screen.d.ts","sourceRoot":"","sources":["../../../src/desktop/screen.ts"],"names":[],"mappings":"AAOA,OAAO,KAAK,EAAE,mBAAmB,EAAE,YAAY,EAAE,MAAM,YAAY,CAAC;AAIpE,qBAAa,aAAa;IACtB,OAAO,CAAC,OAAO,CAAS;gBAEZ,OAAO,GAAE,MAA6B;IAOlD;;OAEG;IACG,OAAO,CAAC,MAAM,CAAC,EAAE,YAAY,GAAG,OAAO,CAAC,mBAAmB,CAAC;YA4BpD,YAAY;YAkCZ,UAAU;YASV,cAAc;IAc5B;;OAEG;IACH,OAAO,IAAI,IAAI;CAWlB"}
|
|
@@ -0,0 +1,120 @@
|
|
|
1
|
+
// ─── Screen Capture ───
|
|
2
|
+
// Takes screenshots using platform-native CLI tools (no npm dependencies).
|
|
3
|
+
import { execFile } from 'node:child_process';
|
|
4
|
+
import { promisify } from 'node:util';
|
|
5
|
+
import { existsSync, mkdirSync } from 'node:fs';
|
|
6
|
+
import { join } from 'node:path';
|
|
7
|
+
const execFileAsync = promisify(execFile);
|
|
8
|
+
export class ScreenCapture {
|
|
9
|
+
tempDir;
|
|
10
|
+
constructor(tempDir = '/tmp/agent-desktop') {
|
|
11
|
+
this.tempDir = tempDir;
|
|
12
|
+
if (!existsSync(this.tempDir)) {
|
|
13
|
+
mkdirSync(this.tempDir, { recursive: true });
|
|
14
|
+
}
|
|
15
|
+
}
|
|
16
|
+
/**
|
|
17
|
+
* Capture a full screenshot or a specific region.
|
|
18
|
+
*/
|
|
19
|
+
async capture(region) {
|
|
20
|
+
const filename = `screenshot-${Date.now()}.png`;
|
|
21
|
+
const filepath = join(this.tempDir, filename);
|
|
22
|
+
const platform = process.platform;
|
|
23
|
+
try {
|
|
24
|
+
if (platform === 'linux') {
|
|
25
|
+
await this.captureLinux(filepath, region);
|
|
26
|
+
}
|
|
27
|
+
else if (platform === 'darwin') {
|
|
28
|
+
await this.captureMac(filepath, region);
|
|
29
|
+
}
|
|
30
|
+
else if (platform === 'win32') {
|
|
31
|
+
await this.captureWindows(filepath, region);
|
|
32
|
+
}
|
|
33
|
+
else {
|
|
34
|
+
throw new Error(`Unsupported platform: ${platform}`);
|
|
35
|
+
}
|
|
36
|
+
return {
|
|
37
|
+
path: filepath,
|
|
38
|
+
width: region?.width ?? 0,
|
|
39
|
+
height: region?.height ?? 0,
|
|
40
|
+
format: 'png',
|
|
41
|
+
timestamp: new Date(),
|
|
42
|
+
};
|
|
43
|
+
}
|
|
44
|
+
catch (err) {
|
|
45
|
+
throw new Error(`Screenshot failed: ${err.message}`);
|
|
46
|
+
}
|
|
47
|
+
}
|
|
48
|
+
async captureLinux(filepath, region) {
|
|
49
|
+
// Try multiple tools in order of preference
|
|
50
|
+
const tools = ['gnome-screenshot', 'scrot', 'import'];
|
|
51
|
+
for (const tool of tools) {
|
|
52
|
+
try {
|
|
53
|
+
if (tool === 'gnome-screenshot') {
|
|
54
|
+
const args = ['-f', filepath];
|
|
55
|
+
if (region) {
|
|
56
|
+
args.push('-a'); // area mode fallback
|
|
57
|
+
}
|
|
58
|
+
await execFileAsync('gnome-screenshot', args, { timeout: 10000 });
|
|
59
|
+
return;
|
|
60
|
+
}
|
|
61
|
+
else if (tool === 'scrot') {
|
|
62
|
+
const args = region
|
|
63
|
+
? ['-a', `${region.x},${region.y},${region.width},${region.height}`, filepath]
|
|
64
|
+
: [filepath];
|
|
65
|
+
await execFileAsync('scrot', args, { timeout: 10000 });
|
|
66
|
+
return;
|
|
67
|
+
}
|
|
68
|
+
else if (tool === 'import') {
|
|
69
|
+
// ImageMagick
|
|
70
|
+
const args = region
|
|
71
|
+
? ['-window', 'root', '-crop', `${region.width}x${region.height}+${region.x}+${region.y}`, filepath]
|
|
72
|
+
: ['-window', 'root', filepath];
|
|
73
|
+
await execFileAsync('import', args, { timeout: 10000 });
|
|
74
|
+
return;
|
|
75
|
+
}
|
|
76
|
+
}
|
|
77
|
+
catch {
|
|
78
|
+
continue; // Try next tool
|
|
79
|
+
}
|
|
80
|
+
}
|
|
81
|
+
throw new Error('No screenshot tool found. Install scrot, gnome-screenshot, or ImageMagick.');
|
|
82
|
+
}
|
|
83
|
+
async captureMac(filepath, region) {
|
|
84
|
+
const args = ['-c', '-x']; // clipboard, no sound
|
|
85
|
+
if (region) {
|
|
86
|
+
args.push('-R', `${region.x},${region.y},${region.width},${region.height}`);
|
|
87
|
+
}
|
|
88
|
+
args.push(filepath);
|
|
89
|
+
await execFileAsync('screencapture', args, { timeout: 10000 });
|
|
90
|
+
}
|
|
91
|
+
async captureWindows(filepath, _region) {
|
|
92
|
+
// PowerShell screenshot command
|
|
93
|
+
const script = `
|
|
94
|
+
Add-Type -AssemblyName System.Windows.Forms;
|
|
95
|
+
[System.Windows.Forms.Screen]::PrimaryScreen | ForEach-Object {
|
|
96
|
+
$bmp = New-Object System.Drawing.Bitmap($_.Bounds.Width, $_.Bounds.Height);
|
|
97
|
+
$graphics = [System.Drawing.Graphics]::FromImage($bmp);
|
|
98
|
+
$graphics.CopyFromScreen($_.Bounds.Location, [System.Drawing.Point]::Empty, $_.Bounds.Size);
|
|
99
|
+
$bmp.Save('${filepath.replace(/\\/g, '\\\\')}');
|
|
100
|
+
}
|
|
101
|
+
`;
|
|
102
|
+
await execFileAsync('powershell', ['-Command', script], { timeout: 10000 });
|
|
103
|
+
}
|
|
104
|
+
/**
|
|
105
|
+
* Clean up all temporary screenshots.
|
|
106
|
+
*/
|
|
107
|
+
cleanup() {
|
|
108
|
+
try {
|
|
109
|
+
const { readdirSync, unlinkSync } = require('node:fs');
|
|
110
|
+
const files = readdirSync(this.tempDir);
|
|
111
|
+
for (const f of files) {
|
|
112
|
+
if (f.startsWith('screenshot-')) {
|
|
113
|
+
unlinkSync(join(this.tempDir, f));
|
|
114
|
+
}
|
|
115
|
+
}
|
|
116
|
+
}
|
|
117
|
+
catch { /* ignore */ }
|
|
118
|
+
}
|
|
119
|
+
}
|
|
120
|
+
//# sourceMappingURL=screen.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"screen.js","sourceRoot":"","sources":["../../../src/desktop/screen.ts"],"names":[],"mappings":"AAAA,yBAAyB;AACzB,2EAA2E;AAE3E,OAAO,EAAE,QAAQ,EAAE,MAAM,oBAAoB,CAAC;AAC9C,OAAO,EAAE,SAAS,EAAE,MAAM,WAAW,CAAC;AACtC,OAAO,EAAE,UAAU,EAAE,SAAS,EAAE,MAAM,SAAS,CAAC;AAChD,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAC;AAGjC,MAAM,aAAa,GAAG,SAAS,CAAC,QAAQ,CAAC,CAAC;AAE1C,MAAM,OAAO,aAAa;IACd,OAAO,CAAS;IAExB,YAAY,UAAkB,oBAAoB;QAC9C,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC;QACvB,IAAI,CAAC,UAAU,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC;YAC5B,SAAS,CAAC,IAAI,CAAC,OAAO,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;QACjD,CAAC;IACL,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,OAAO,CAAC,MAAqB;QAC/B,MAAM,QAAQ,GAAG,cAAc,IAAI,CAAC,GAAG,EAAE,MAAM,CAAC;QAChD,MAAM,QAAQ,GAAG,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,QAAQ,CAAC,CAAC;QAC9C,MAAM,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QAElC,IAAI,CAAC;YACD,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;gBACvB,MAAM,IAAI,CAAC,YAAY,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;YAC9C,CAAC;iBAAM,IAAI,QAAQ,KAAK,QAAQ,EAAE,CAAC;gBAC/B,MAAM,IAAI,CAAC,UAAU,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;YAC5C,CAAC;iBAAM,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;gBAC9B,MAAM,IAAI,CAAC,cAAc,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;YAChD,CAAC;iBAAM,CAAC;gBACJ,MAAM,IAAI,KAAK,CAAC,yBAAyB,QAAQ,EAAE,CAAC,CAAC;YACzD,CAAC;YAED,OAAO;gBACH,IAAI,EAAE,QAAQ;gBACd,KAAK,EAAE,MAAM,EAAE,KAAK,IAAI,CAAC;gBACzB,MAAM,EAAE,MAAM,EAAE,MAAM,IAAI,CAAC;gBAC3B,MAAM,EAAE,KAAK;gBACb,SAAS,EAAE,IAAI,IAAI,EAAE;aACxB,CAAC;QACN,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,MAAM,IAAI,KAAK,CAAC,sBAAuB,GAAa,CAAC,OAAO,EAAE,CAAC,CAAC;QACpE,CAAC;IACL,CAAC;IAEO,KAAK,CAAC,YAAY,CAAC,QAAgB,EAAE,MAAqB;QAC9D,4CAA4C;QAC5C,MAAM,KAAK,GAAG,CAAC,kBAAkB,EAAE,OAAO,EAAE,QAAQ,CAAC,CAAC;QAEtD,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;YACvB,IAAI,CAAC;gBACD,IAAI,IAAI,KAAK,kBAAkB,EAAE,CAAC;oBAC9B,MAAM,IAAI,GAAG,CAAC,IAAI,EAAE,QAAQ,CAAC,CAAC;oBAC9B,IAAI,MAAM,EAAE,CAAC;wBACT,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,qBAAqB;oBAC1C,CAAC;oBACD,MAAM,aAAa,CAAC,kBAAkB,EAAE,IAAI,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC,CAAC;oBAClE,OAAO;gBACX,CAAC;qBAAM,IAAI,IAAI,KAAK,OAAO,EAAE,CAAC;oBAC1B,MAAM,IAAI,GAAG,MAAM;wBACf,CAAC,CAAC,CAAC,IAAI,EAAE,GAAG,MAAM,CAAC,CAAC,IAAI,MAAM,CAAC,CAAC,IAAI,MAAM,CAAC,KAAK,IAAI,MAAM,CAAC,MAAM,EAAE,EAAE,QAAQ,CAAC;wBAC9E,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC;oBACjB,MAAM,aAAa,CAAC,OAAO,EAAE,IAAI,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC,CAAC;oBACvD,OAAO;gBACX,CAAC;qBAAM,IAAI,IAAI,KAAK,QAAQ,EAAE,CAAC;oBAC3B,cAAc;oBACd,MAAM,IAAI,GAAG,MAAM;wBACf,CAAC,CAAC,CAAC,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,MAAM,CAAC,KAAK,IAAI,MAAM,CAAC,MAAM,IAAI,MAAM,CAAC,CAAC,IAAI,MAAM,CAAC,CAAC,EAAE,EAAE,QAAQ,CAAC;wBACpG,CAAC,CAAC,CAAC,SAAS,EAAE,MAAM,EAAE,QAAQ,CAAC,CAAC;oBACpC,MAAM,aAAa,CAAC,QAAQ,EAAE,IAAI,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC,CAAC;oBACxD,OAAO;gBACX,CAAC;YACL,CAAC;YAAC,MAAM,CAAC;gBACL,SAAS,CAAC,gBAAgB;YAC9B,CAAC;QACL,CAAC;QACD,MAAM,IAAI,KAAK,CAAC,4EAA4E,CAAC,CAAC;IAClG,CAAC;IAEO,KAAK,CAAC,UAAU,CAAC,QAAgB,EAAE,MAAqB;QAC5D,MAAM,IAAI,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC,CAAC,sBAAsB;QACjD,IAAI,MAAM,EAAE,CAAC;YACT,IAAI,CAAC,IAAI,CAAC,IAAI,EAAE,GAAG,MAAM,CAAC,CAAC,IAAI,MAAM,CAAC,CAAC,IAAI,MAAM,CAAC,KAAK,IAAI,MAAM,CAAC,MAAM,EAAE,CAAC,CAAC;QAChF,CAAC;QACD,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACpB,MAAM,aAAa,CAAC,eAAe,EAAE,IAAI,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC,CAAC;IACnE,CAAC;IAEO,KAAK,CAAC,cAAc,CAAC,QAAgB,EAAE,OAAsB;QACjE,gCAAgC;QAChC,MAAM,MAAM,GAAG;;;;;;6BAMM,QAAQ,CAAC,OAAO,CAAC,KAAK,EAAE,MAAM,CAAC;;SAEnD,CAAC;QACF,MAAM,aAAa,CAAC,YAAY,EAAE,CAAC,UAAU,EAAE,MAAM,CAAC,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC,CAAC;IAChF,CAAC;IAED;;OAEG;IACH,OAAO;QACH,IAAI,CAAC;YACD,MAAM,EAAE,WAAW,EAAE,UAAU,EAAE,GAAG,OAAO,CAAC,SAAS,CAAC,CAAC;YACvD,MAAM,KAAK,GAAG,WAAW,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;YACxC,KAAK,MAAM,CAAC,IAAI,KAAK,EAAE,CAAC;gBACpB,IAAI,CAAC,CAAC,UAAU,CAAC,aAAa,CAAC,EAAE,CAAC;oBAC9B,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC,CAAC;gBACtC,CAAC;YACL,CAAC;QACL,CAAC;QAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC;IAC5B,CAAC;CACJ"}
|
|
@@ -0,0 +1,50 @@
|
|
|
1
|
+
export interface DesktopConfig {
|
|
2
|
+
/** Enable desktop automation */
|
|
3
|
+
enabled: boolean;
|
|
4
|
+
/** Screenshot format */
|
|
5
|
+
screenshotFormat: 'png' | 'jpg';
|
|
6
|
+
/** Screenshot quality (jpg only, 1-100) */
|
|
7
|
+
screenshotQuality: number;
|
|
8
|
+
/** Default delay between actions (ms) */
|
|
9
|
+
actionDelay: number;
|
|
10
|
+
/** Whether to use OCR on screenshots */
|
|
11
|
+
ocrEnabled: boolean;
|
|
12
|
+
/** Temporary directory for screenshots */
|
|
13
|
+
tempDir: string;
|
|
14
|
+
}
|
|
15
|
+
export declare const DEFAULT_DESKTOP_CONFIG: DesktopConfig;
|
|
16
|
+
export interface ScreenRegion {
|
|
17
|
+
x: number;
|
|
18
|
+
y: number;
|
|
19
|
+
width: number;
|
|
20
|
+
height: number;
|
|
21
|
+
}
|
|
22
|
+
export interface MouseAction {
|
|
23
|
+
type: 'click' | 'doubleClick' | 'rightClick' | 'move' | 'drag' | 'scroll';
|
|
24
|
+
x?: number;
|
|
25
|
+
y?: number;
|
|
26
|
+
toX?: number;
|
|
27
|
+
toY?: number;
|
|
28
|
+
scrollAmount?: number;
|
|
29
|
+
button?: 'left' | 'right' | 'middle';
|
|
30
|
+
}
|
|
31
|
+
export interface KeyboardAction {
|
|
32
|
+
type: 'type' | 'press' | 'hotkey';
|
|
33
|
+
text?: string;
|
|
34
|
+
key?: string;
|
|
35
|
+
modifiers?: Array<'ctrl' | 'alt' | 'shift' | 'meta'>;
|
|
36
|
+
}
|
|
37
|
+
export interface ScreenCaptureResult {
|
|
38
|
+
path: string;
|
|
39
|
+
width: number;
|
|
40
|
+
height: number;
|
|
41
|
+
format: string;
|
|
42
|
+
timestamp: Date;
|
|
43
|
+
}
|
|
44
|
+
export interface DesktopActionResult {
|
|
45
|
+
success: boolean;
|
|
46
|
+
action: string;
|
|
47
|
+
error?: string;
|
|
48
|
+
screenshot?: ScreenCaptureResult;
|
|
49
|
+
}
|
|
50
|
+
//# sourceMappingURL=types.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../../../src/desktop/types.ts"],"names":[],"mappings":"AAEA,MAAM,WAAW,aAAa;IAC1B,gCAAgC;IAChC,OAAO,EAAE,OAAO,CAAC;IACjB,wBAAwB;IACxB,gBAAgB,EAAE,KAAK,GAAG,KAAK,CAAC;IAChC,2CAA2C;IAC3C,iBAAiB,EAAE,MAAM,CAAC;IAC1B,yCAAyC;IACzC,WAAW,EAAE,MAAM,CAAC;IACpB,wCAAwC;IACxC,UAAU,EAAE,OAAO,CAAC;IACpB,0CAA0C;IAC1C,OAAO,EAAE,MAAM,CAAC;CACnB;AAED,eAAO,MAAM,sBAAsB,EAAE,aAOpC,CAAC;AAEF,MAAM,WAAW,YAAY;IACzB,CAAC,EAAE,MAAM,CAAC;IACV,CAAC,EAAE,MAAM,CAAC;IACV,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,WAAW;IACxB,IAAI,EAAE,OAAO,GAAG,aAAa,GAAG,YAAY,GAAG,MAAM,GAAG,MAAM,GAAG,QAAQ,CAAC;IAC1E,CAAC,CAAC,EAAE,MAAM,CAAC;IACX,CAAC,CAAC,EAAE,MAAM,CAAC;IACX,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,MAAM,CAAC,EAAE,MAAM,GAAG,OAAO,GAAG,QAAQ,CAAC;CACxC;AAED,MAAM,WAAW,cAAc;IAC3B,IAAI,EAAE,MAAM,GAAG,OAAO,GAAG,QAAQ,CAAC;IAClC,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,SAAS,CAAC,EAAE,KAAK,CAAC,MAAM,GAAG,KAAK,GAAG,OAAO,GAAG,MAAM,CAAC,CAAC;CACxD;AAED,MAAM,WAAW,mBAAmB;IAChC,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,CAAC;IACf,MAAM,EAAE,MAAM,CAAC;IACf,SAAS,EAAE,IAAI,CAAC;CACnB;AAED,MAAM,WAAW,mBAAmB;IAChC,OAAO,EAAE,OAAO,CAAC;IACjB,MAAM,EAAE,MAAM,CAAC;IACf,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,UAAU,CAAC,EAAE,mBAAmB,CAAC;CACpC"}
|
|
@@ -0,0 +1,10 @@
|
|
|
1
|
+
// ─── Desktop Automation Types ───
|
|
2
|
+
export const DEFAULT_DESKTOP_CONFIG = {
|
|
3
|
+
enabled: false,
|
|
4
|
+
screenshotFormat: 'png',
|
|
5
|
+
screenshotQuality: 80,
|
|
6
|
+
actionDelay: 100,
|
|
7
|
+
ocrEnabled: false,
|
|
8
|
+
tempDir: '/tmp/agent-desktop',
|
|
9
|
+
};
|
|
10
|
+
//# sourceMappingURL=types.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.js","sourceRoot":"","sources":["../../../src/desktop/types.ts"],"names":[],"mappings":"AAAA,mCAAmC;AAiBnC,MAAM,CAAC,MAAM,sBAAsB,GAAkB;IACjD,OAAO,EAAE,KAAK;IACd,gBAAgB,EAAE,KAAK;IACvB,iBAAiB,EAAE,EAAE;IACrB,WAAW,EAAE,GAAG;IAChB,UAAU,EAAE,KAAK;IACjB,OAAO,EAAE,oBAAoB;CAChC,CAAC"}
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
import type { MultimodalConfig, TranscriptionResult, VisionAnalysisResult, SpeechResult } from './types.js';
|
|
2
|
+
export declare class MultimodalEngine {
|
|
3
|
+
private config;
|
|
4
|
+
private voice;
|
|
5
|
+
private vision;
|
|
6
|
+
private tts;
|
|
7
|
+
constructor(config?: Partial<MultimodalConfig>);
|
|
8
|
+
get enabled(): boolean;
|
|
9
|
+
/**
|
|
10
|
+
* Transcribe audio to text (speech-to-text).
|
|
11
|
+
*/
|
|
12
|
+
transcribe(audioPath: string): Promise<TranscriptionResult>;
|
|
13
|
+
/**
|
|
14
|
+
* Analyze an image with a text prompt (vision).
|
|
15
|
+
*/
|
|
16
|
+
analyzeImage(imagePath: string, prompt?: string): Promise<VisionAnalysisResult>;
|
|
17
|
+
/**
|
|
18
|
+
* Analyze an image from a URL.
|
|
19
|
+
*/
|
|
20
|
+
analyzeImageUrl(url: string, prompt?: string): Promise<VisionAnalysisResult>;
|
|
21
|
+
/**
|
|
22
|
+
* Convert text to speech.
|
|
23
|
+
*/
|
|
24
|
+
speak(text: string, outputDir?: string): Promise<SpeechResult>;
|
|
25
|
+
/**
|
|
26
|
+
* Full pipeline: take a screenshot → analyze it → describe what's on screen.
|
|
27
|
+
* (Requires desktop module integration)
|
|
28
|
+
*/
|
|
29
|
+
describeScreen(screenshotPath: string): Promise<VisionAnalysisResult>;
|
|
30
|
+
}
|
|
31
|
+
export declare function getMultimodalEngine(): MultimodalEngine | null;
|
|
32
|
+
export declare function initMultimodalEngine(config?: Partial<MultimodalConfig>): MultimodalEngine;
|
|
33
|
+
//# sourceMappingURL=engine.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"engine.d.ts","sourceRoot":"","sources":["../../../src/multimodal/engine.ts"],"names":[],"mappings":"AAMA,OAAO,KAAK,EAAE,gBAAgB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,YAAY,EAAE,MAAM,YAAY,CAAC;AAG5G,qBAAa,gBAAgB;IACzB,OAAO,CAAC,MAAM,CAAmB;IACjC,OAAO,CAAC,KAAK,CAAa;IAC1B,OAAO,CAAC,MAAM,CAAiB;IAC/B,OAAO,CAAC,GAAG,CAAe;gBAEd,MAAM,CAAC,EAAE,OAAO,CAAC,gBAAgB,CAAC;IAS9C,IAAI,OAAO,IAAI,OAAO,CAErB;IAED;;OAEG;IACG,UAAU,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,mBAAmB,CAAC;IAIjE;;OAEG;IACG,YAAY,CAAC,SAAS,EAAE,MAAM,EAAE,MAAM,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC,oBAAoB,CAAC;IAIrF;;OAEG;IACG,eAAe,CAAC,GAAG,EAAE,MAAM,EAAE,MAAM,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC,oBAAoB,CAAC;IAIlF;;OAEG;IACG,KAAK,CAAC,IAAI,EAAE,MAAM,EAAE,SAAS,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC,YAAY,CAAC;IAIpE;;;OAGG;IACG,cAAc,CAAC,cAAc,EAAE,MAAM,GAAG,OAAO,CAAC,oBAAoB,CAAC;CAG9E;AAKD,wBAAgB,mBAAmB,IAAI,gBAAgB,GAAG,IAAI,CAE7D;AAED,wBAAgB,oBAAoB,CAAC,MAAM,CAAC,EAAE,OAAO,CAAC,gBAAgB,CAAC,GAAG,gBAAgB,CAGzF"}
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
// ─── Multimodal Engine ───
|
|
2
|
+
// Unified interface for voice input, image analysis, and text-to-speech.
|
|
3
|
+
import { VoiceInput } from './voice.js';
|
|
4
|
+
import { VisionAnalyzer } from './vision.js';
|
|
5
|
+
import { TextToSpeech } from './tts.js';
|
|
6
|
+
import { DEFAULT_MULTIMODAL_CONFIG } from './types.js';
|
|
7
|
+
export class MultimodalEngine {
|
|
8
|
+
config;
|
|
9
|
+
voice;
|
|
10
|
+
vision;
|
|
11
|
+
tts;
|
|
12
|
+
constructor(config) {
|
|
13
|
+
this.config = { ...DEFAULT_MULTIMODAL_CONFIG, ...config };
|
|
14
|
+
const apiKey = this.config.apiKey || process.env.OPENAI_API_KEY || '';
|
|
15
|
+
this.voice = new VoiceInput(this.config.voice, apiKey);
|
|
16
|
+
this.vision = new VisionAnalyzer(this.config.vision, apiKey);
|
|
17
|
+
this.tts = new TextToSpeech(this.config.tts, apiKey);
|
|
18
|
+
}
|
|
19
|
+
get enabled() {
|
|
20
|
+
return this.config.enabled;
|
|
21
|
+
}
|
|
22
|
+
/**
|
|
23
|
+
* Transcribe audio to text (speech-to-text).
|
|
24
|
+
*/
|
|
25
|
+
async transcribe(audioPath) {
|
|
26
|
+
return this.voice.transcribe(audioPath);
|
|
27
|
+
}
|
|
28
|
+
/**
|
|
29
|
+
* Analyze an image with a text prompt (vision).
|
|
30
|
+
*/
|
|
31
|
+
async analyzeImage(imagePath, prompt) {
|
|
32
|
+
return this.vision.analyze(imagePath, prompt);
|
|
33
|
+
}
|
|
34
|
+
/**
|
|
35
|
+
* Analyze an image from a URL.
|
|
36
|
+
*/
|
|
37
|
+
async analyzeImageUrl(url, prompt) {
|
|
38
|
+
return this.vision.analyzeUrl(url, prompt);
|
|
39
|
+
}
|
|
40
|
+
/**
|
|
41
|
+
* Convert text to speech.
|
|
42
|
+
*/
|
|
43
|
+
async speak(text, outputDir) {
|
|
44
|
+
return this.tts.speak(text, outputDir);
|
|
45
|
+
}
|
|
46
|
+
/**
|
|
47
|
+
* Full pipeline: take a screenshot → analyze it → describe what's on screen.
|
|
48
|
+
* (Requires desktop module integration)
|
|
49
|
+
*/
|
|
50
|
+
async describeScreen(screenshotPath) {
|
|
51
|
+
return this.vision.analyze(screenshotPath, 'Describe what is shown on this screen in detail. Identify any UI elements, text, and interactive components.');
|
|
52
|
+
}
|
|
53
|
+
}
|
|
54
|
+
// ─── Singleton ───
|
|
55
|
+
let multimodalInstance = null;
|
|
56
|
+
export function getMultimodalEngine() {
|
|
57
|
+
return multimodalInstance;
|
|
58
|
+
}
|
|
59
|
+
export function initMultimodalEngine(config) {
|
|
60
|
+
multimodalInstance = new MultimodalEngine(config);
|
|
61
|
+
return multimodalInstance;
|
|
62
|
+
}
|
|
63
|
+
//# sourceMappingURL=engine.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"engine.js","sourceRoot":"","sources":["../../../src/multimodal/engine.ts"],"names":[],"mappings":"AAAA,4BAA4B;AAC5B,yEAAyE;AAEzE,OAAO,EAAE,UAAU,EAAE,MAAM,YAAY,CAAC;AACxC,OAAO,EAAE,cAAc,EAAE,MAAM,aAAa,CAAC;AAC7C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AAExC,OAAO,EAAE,yBAAyB,EAAE,MAAM,YAAY,CAAC;AAEvD,MAAM,OAAO,gBAAgB;IACjB,MAAM,CAAmB;IACzB,KAAK,CAAa;IAClB,MAAM,CAAiB;IACvB,GAAG,CAAe;IAE1B,YAAY,MAAkC;QAC1C,IAAI,CAAC,MAAM,GAAG,EAAE,GAAG,yBAAyB,EAAE,GAAG,MAAM,EAAE,CAAC;QAC1D,MAAM,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,MAAM,IAAI,OAAO,CAAC,GAAG,CAAC,cAAc,IAAI,EAAE,CAAC;QAEtE,IAAI,CAAC,KAAK,GAAG,IAAI,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC;QACvD,IAAI,CAAC,MAAM,GAAG,IAAI,cAAc,CAAC,IAAI,CAAC,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;QAC7D,IAAI,CAAC,GAAG,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,MAAM,CAAC,GAAG,EAAE,MAAM,CAAC,CAAC;IACzD,CAAC;IAED,IAAI,OAAO;QACP,OAAO,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC;IAC/B,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,UAAU,CAAC,SAAiB;QAC9B,OAAO,IAAI,CAAC,KAAK,CAAC,UAAU,CAAC,SAAS,CAAC,CAAC;IAC5C,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,YAAY,CAAC,SAAiB,EAAE,MAAe;QACjD,OAAO,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,SAAS,EAAE,MAAM,CAAC,CAAC;IAClD,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,eAAe,CAAC,GAAW,EAAE,MAAe;QAC9C,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,GAAG,EAAE,MAAM,CAAC,CAAC;IAC/C,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,KAAK,CAAC,IAAY,EAAE,SAAkB;QACxC,OAAO,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,IAAI,EAAE,SAAS,CAAC,CAAC;IAC3C,CAAC;IAED;;;OAGG;IACH,KAAK,CAAC,cAAc,CAAC,cAAsB;QACvC,OAAO,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,cAAc,EAAE,8GAA8G,CAAC,CAAC;IAC/J,CAAC;CACJ;AAED,oBAAoB;AACpB,IAAI,kBAAkB,GAA4B,IAAI,CAAC;AAEvD,MAAM,UAAU,mBAAmB;IAC/B,OAAO,kBAAkB,CAAC;AAC9B,CAAC;AAED,MAAM,UAAU,oBAAoB,CAAC,MAAkC;IACnE,kBAAkB,GAAG,IAAI,gBAAgB,CAAC,MAAM,CAAC,CAAC;IAClD,OAAO,kBAAkB,CAAC;AAC9B,CAAC"}
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
export { MultimodalEngine, getMultimodalEngine, initMultimodalEngine } from './engine.js';
|
|
2
|
+
export { VoiceInput } from './voice.js';
|
|
3
|
+
export { VisionAnalyzer } from './vision.js';
|
|
4
|
+
export { TextToSpeech } from './tts.js';
|
|
5
|
+
export type { MultimodalConfig, VoiceConfig, VisionConfig, TTSConfig, TranscriptionResult, VisionAnalysisResult, SpeechResult } from './types.js';
|
|
6
|
+
export { DEFAULT_MULTIMODAL_CONFIG } from './types.js';
|
|
7
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/multimodal/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,gBAAgB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,aAAa,CAAC;AAC1F,OAAO,EAAE,UAAU,EAAE,MAAM,YAAY,CAAC;AACxC,OAAO,EAAE,cAAc,EAAE,MAAM,aAAa,CAAC;AAC7C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,YAAY,EAAE,gBAAgB,EAAE,WAAW,EAAE,YAAY,EAAE,SAAS,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,YAAY,EAAE,MAAM,YAAY,CAAC;AAClJ,OAAO,EAAE,yBAAyB,EAAE,MAAM,YAAY,CAAC"}
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
// ─── Multimodal Module Index ───
|
|
2
|
+
export { MultimodalEngine, getMultimodalEngine, initMultimodalEngine } from './engine.js';
|
|
3
|
+
export { VoiceInput } from './voice.js';
|
|
4
|
+
export { VisionAnalyzer } from './vision.js';
|
|
5
|
+
export { TextToSpeech } from './tts.js';
|
|
6
|
+
export { DEFAULT_MULTIMODAL_CONFIG } from './types.js';
|
|
7
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/multimodal/index.ts"],"names":[],"mappings":"AAAA,kCAAkC;AAClC,OAAO,EAAE,gBAAgB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,aAAa,CAAC;AAC1F,OAAO,EAAE,UAAU,EAAE,MAAM,YAAY,CAAC;AACxC,OAAO,EAAE,cAAc,EAAE,MAAM,aAAa,CAAC;AAC7C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AAExC,OAAO,EAAE,yBAAyB,EAAE,MAAM,YAAY,CAAC"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import type { TTSConfig, SpeechResult } from './types.js';
|
|
2
|
+
export declare class TextToSpeech {
|
|
3
|
+
private config;
|
|
4
|
+
private apiKey;
|
|
5
|
+
constructor(config: TTSConfig, apiKey: string);
|
|
6
|
+
/**
|
|
7
|
+
* Convert text to speech and save as an audio file.
|
|
8
|
+
*/
|
|
9
|
+
speak(text: string, outputDir?: string): Promise<SpeechResult>;
|
|
10
|
+
}
|
|
11
|
+
//# sourceMappingURL=tts.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts.d.ts","sourceRoot":"","sources":["../../../src/multimodal/tts.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,SAAS,EAAE,YAAY,EAAE,MAAM,YAAY,CAAC;AAE1D,qBAAa,YAAY;IACrB,OAAO,CAAC,MAAM,CAAY;IAC1B,OAAO,CAAC,MAAM,CAAS;gBAEX,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM;IAK7C;;OAEG;IACG,KAAK,CAAC,IAAI,EAAE,MAAM,EAAE,SAAS,GAAE,MAAyB,GAAG,OAAO,CAAC,YAAY,CAAC;CAqCzF"}
|
|
@@ -0,0 +1,48 @@
|
|
|
1
|
+
// ─── Text-to-Speech ───
|
|
2
|
+
// Uses OpenAI TTS API to generate spoken audio.
|
|
3
|
+
import { writeFileSync } from 'node:fs';
|
|
4
|
+
import { join } from 'node:path';
|
|
5
|
+
export class TextToSpeech {
|
|
6
|
+
config;
|
|
7
|
+
apiKey;
|
|
8
|
+
constructor(config, apiKey) {
|
|
9
|
+
this.config = config;
|
|
10
|
+
this.apiKey = apiKey;
|
|
11
|
+
}
|
|
12
|
+
/**
|
|
13
|
+
* Convert text to speech and save as an audio file.
|
|
14
|
+
*/
|
|
15
|
+
async speak(text, outputDir = '/tmp/agent-tts') {
|
|
16
|
+
const res = await fetch('https://api.openai.com/v1/audio/speech', {
|
|
17
|
+
method: 'POST',
|
|
18
|
+
headers: {
|
|
19
|
+
'Content-Type': 'application/json',
|
|
20
|
+
'Authorization': `Bearer ${this.apiKey}`,
|
|
21
|
+
},
|
|
22
|
+
body: JSON.stringify({
|
|
23
|
+
model: this.config.model,
|
|
24
|
+
input: text,
|
|
25
|
+
voice: this.config.voice,
|
|
26
|
+
response_format: this.config.format,
|
|
27
|
+
speed: this.config.speed,
|
|
28
|
+
}),
|
|
29
|
+
});
|
|
30
|
+
if (!res.ok) {
|
|
31
|
+
const err = await res.json();
|
|
32
|
+
throw new Error(`TTS API Error: ${err.error?.message || JSON.stringify(err)}`);
|
|
33
|
+
}
|
|
34
|
+
const audioBuffer = Buffer.from(await res.arrayBuffer());
|
|
35
|
+
const filename = `speech-${Date.now()}.${this.config.format}`;
|
|
36
|
+
const outputPath = join(outputDir, filename);
|
|
37
|
+
// Ensure output dir exists
|
|
38
|
+
const { mkdirSync } = require('node:fs');
|
|
39
|
+
mkdirSync(outputDir, { recursive: true });
|
|
40
|
+
writeFileSync(outputPath, audioBuffer);
|
|
41
|
+
return {
|
|
42
|
+
audioPath: outputPath,
|
|
43
|
+
format: this.config.format,
|
|
44
|
+
text: text.slice(0, 100) + (text.length > 100 ? '...' : ''),
|
|
45
|
+
};
|
|
46
|
+
}
|
|
47
|
+
}
|
|
48
|
+
//# sourceMappingURL=tts.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts.js","sourceRoot":"","sources":["../../../src/multimodal/tts.ts"],"names":[],"mappings":"AAAA,yBAAyB;AACzB,gDAAgD;AAEhD,OAAO,EAAE,aAAa,EAAE,MAAM,SAAS,CAAC;AACxC,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAC;AAGjC,MAAM,OAAO,YAAY;IACb,MAAM,CAAY;IAClB,MAAM,CAAS;IAEvB,YAAY,MAAiB,EAAE,MAAc;QACzC,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;IACzB,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,KAAK,CAAC,IAAY,EAAE,YAAoB,gBAAgB;QAC1D,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,wCAAwC,EAAE;YAC9D,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACL,cAAc,EAAE,kBAAkB;gBAClC,eAAe,EAAE,UAAU,IAAI,CAAC,MAAM,EAAE;aAC3C;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC;gBACjB,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAK;gBACxB,KAAK,EAAE,IAAI;gBACX,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAK;gBACxB,eAAe,EAAE,IAAI,CAAC,MAAM,CAAC,MAAM;gBACnC,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAK;aAC3B,CAAC;SACL,CAAC,CAAC;QAEH,IAAI,CAAC,GAAG,CAAC,EAAE,EAAE,CAAC;YACV,MAAM,GAAG,GAAG,MAAM,GAAG,CAAC,IAAI,EAAS,CAAC;YACpC,MAAM,IAAI,KAAK,CAAC,kBAAkB,GAAG,CAAC,KAAK,EAAE,OAAO,IAAI,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACnF,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,WAAW,EAAE,CAAC,CAAC;QACzD,MAAM,QAAQ,GAAG,UAAU,IAAI,CAAC,GAAG,EAAE,IAAI,IAAI,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC;QAC9D,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,EAAE,QAAQ,CAAC,CAAC;QAE7C,2BAA2B;QAC3B,MAAM,EAAE,SAAS,EAAE,GAAG,OAAO,CAAC,SAAS,CAAC,CAAC;QACzC,SAAS,CAAC,SAAS,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;QAE1C,aAAa,CAAC,UAAU,EAAE,WAAW,CAAC,CAAC;QAEvC,OAAO;YACH,SAAS,EAAE,UAAU;YACrB,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,MAAM;YAC1B,IAAI,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,GAAG,GAAG,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;SAC9D,CAAC;IACN,CAAC;CACJ"}
|