0agent 1.0.65 → 1.0.67
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/dist/daemon.mjs +16 -7
- package/package.json +1 -1
package/dist/daemon.mjs
CHANGED
|
@@ -3371,8 +3371,9 @@ var init_CapabilityRegistry = __esm({
|
|
|
3371
3371
|
active.add("scrape_url");
|
|
3372
3372
|
active.add("browser_open");
|
|
3373
3373
|
}
|
|
3374
|
-
if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use/i.test(lower)) {
|
|
3374
|
+
if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use|whatsapp|telegram|youtube|music|play|pause|resume|stop|skip|next.*track|prev|send.*message/i.test(lower)) {
|
|
3375
3375
|
active.add("computer_use");
|
|
3376
|
+
active.add("gui_automation");
|
|
3376
3377
|
}
|
|
3377
3378
|
return [...this.capabilities.values()].filter((c) => active.has(c.name)).map((c) => c.toolDefinition);
|
|
3378
3379
|
}
|
|
@@ -3782,12 +3783,20 @@ content = element.text if element else page.get_all_text()` : `content = page.ge
|
|
|
3782
3783
|
if (hasGUI) {
|
|
3783
3784
|
lines.push(
|
|
3784
3785
|
``,
|
|
3785
|
-
`
|
|
3786
|
-
`
|
|
3787
|
-
`
|
|
3788
|
-
`
|
|
3789
|
-
`
|
|
3790
|
-
`
|
|
3786
|
+
`GUI/Browser rules:`,
|
|
3787
|
+
`1. open_url returns actual URL + title + "Video: PLAYING:1.4s \u2713" or "Video: PAUSED".`,
|
|
3788
|
+
` Read it. If video is PAUSED or title shows wrong page \u2014 take corrective action.`,
|
|
3789
|
+
`2. exec_js: run JS in the current Chrome tab \u2014 NO Screen Recording needed.`,
|
|
3790
|
+
` MEDIA CONTROL \u2192 always use exec_js, never hotkey (hotkeys go to Terminal not Chrome):`,
|
|
3791
|
+
` pause: {action:"exec_js",js:"document.querySelector('video').pause()"}`,
|
|
3792
|
+
` play: {action:"exec_js",js:"document.querySelector('video').play()"}`,
|
|
3793
|
+
` check: {action:"exec_js",js:"document.querySelector('video').paused+' t='+document.querySelector('video').currentTime"}`,
|
|
3794
|
+
` click: {action:"exec_js",js:"document.querySelector('.some-selector').click()"}`,
|
|
3795
|
+
`3. hotkey with app param: {action:"hotkey",keys:"k",app:"Google Chrome"} focuses Chrome first,`,
|
|
3796
|
+
` then sends the key via AppleScript (reliable). Without app param, key goes to Terminal.`,
|
|
3797
|
+
`4. browser_state: quickly verify current tab URL + title after any navigation.`,
|
|
3798
|
+
`5. NEVER claim success based on action alone. exec_js to verify: video.paused, page title, etc.`,
|
|
3799
|
+
`6. computer_use: for multi-step desktop tasks \u2014 {task:"full goal description"}. No confirmation.`
|
|
3791
3800
|
);
|
|
3792
3801
|
}
|
|
3793
3802
|
if (isSelfMod && this.agentRoot) {
|