0agent 1.0.55 → 1.0.56
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
- package/dist/daemon.mjs +7 -5
- package/package.json +1 -1
package/dist/daemon.mjs
CHANGED
|
@@ -2599,7 +2599,7 @@ var init_GUICapability = __esm({
|
|
|
2599
2599
|
description = "Automate desktop GUI \u2014 click, type, screenshot, hotkeys, find text on screen.";
|
|
2600
2600
|
toolDefinition = {
|
|
2601
2601
|
name: "gui_automation",
|
|
2602
|
-
description:
|
|
2602
|
+
description: "Desktop GUI automation \u2014 ONLY use for tasks that explicitly require controlling the screen. DO NOT use for coding, research, file edits, or any task that does not need the desktop UI. Actions: click, type, hotkey, scroll, find_and_click, open_url, open_app. screenshot: use sparingly \u2014 only when you cannot proceed without seeing the current screen. Max 2 per task. To open a website use open_url (reuses existing browser tab, never opens duplicate windows).",
|
|
2603
2603
|
input_schema: {
|
|
2604
2604
|
type: "object",
|
|
2605
2605
|
properties: {
|
|
@@ -3497,12 +3497,14 @@ content = element.text if element else page.get_all_text()` : `content = page.ge
|
|
|
3497
3497
|
`- Use relative paths from the working directory`,
|
|
3498
3498
|
`- Be concise in your final response: state what was done and where to find it`,
|
|
3499
3499
|
``,
|
|
3500
|
-
`GUI Automation (gui_automation tool):`,
|
|
3501
|
-
`-
|
|
3502
|
-
`-
|
|
3503
|
-
`-
|
|
3500
|
+
`GUI Automation (gui_automation tool) \u2014 ONLY use when the task explicitly requires controlling the desktop UI:`,
|
|
3501
|
+
`- DO NOT take screenshots for general tasks, coding, research, or anything that doesn't need the screen`,
|
|
3502
|
+
`- Only screenshot when you genuinely cannot proceed without seeing the current screen state`,
|
|
3503
|
+
`- Prefer find_and_click, hotkey, open_url, and type over repeated screenshots`,
|
|
3504
|
+
`- Max 2 screenshots per task \u2014 if you've already seen the screen, act on that knowledge`,
|
|
3504
3505
|
`- Use find_and_click to click on text by name rather than guessing coordinates`,
|
|
3505
3506
|
`- Use hotkey for keyboard shortcuts: "cmd+c", "ctrl+v", "alt+tab", "cmd+space"`,
|
|
3507
|
+
`- To open a website: use open_url \u2014 it reuses the existing browser tab`,
|
|
3506
3508
|
...hasMemory ? [
|
|
3507
3509
|
``,
|
|
3508
3510
|
`Memory (CRITICAL \u2014 write EVERYTHING you learn):`,
|