0agent 1.0.65 → 1.0.67

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.
Files changed (2)
  1. package/dist/daemon.mjs +16 -7
  2. package/package.json +1 -1
package/dist/daemon.mjs CHANGED
@@ -3371,8 +3371,9 @@ var init_CapabilityRegistry = __esm({
3371
3371
  active.add("scrape_url");
3372
3372
  active.add("browser_open");
3373
3373
  }
3374
- if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use/i.test(lower)) {
3374
+ if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use|whatsapp|telegram|youtube|music|play|pause|resume|stop|skip|next.*track|prev|send.*message/i.test(lower)) {
3375
3375
  active.add("computer_use");
3376
+ active.add("gui_automation");
3376
3377
  }
3377
3378
  return [...this.capabilities.values()].filter((c) => active.has(c.name)).map((c) => c.toolDefinition);
3378
3379
  }
@@ -3782,12 +3783,20 @@ content = element.text if element else page.get_all_text()` : `content = page.ge
3782
3783
  if (hasGUI) {
3783
3784
  lines.push(
3784
3785
  ``,
3785
- `Computer use: use computer_use for any desktop/browser/keyboard/mouse task.`,
3786
- `Pass a plain-English task description \u2014 e.g. {task: "Open WhatsApp, search for Sahil Godara, send Hi"}.`,
3787
- `DO NOT split into separate tool calls \u2014 describe the full end-to-end goal in ONE computer_use call.`,
3788
- `DO NOT ask for confirmation before computer_use \u2014 execute immediately.`,
3789
- `For messaging apps (WhatsApp, Telegram, iMessage): use computer_use directly, no confirmation needed.`,
3790
- `After computer_use, verify success by calling it again with task="take a screenshot and describe what you see".`
3786
+ `GUI/Browser rules:`,
3787
+ `1. open_url returns actual URL + title + "Video: PLAYING:1.4s \u2713" or "Video: PAUSED".`,
3788
+ ` Read it. If video is PAUSED or title shows wrong page \u2014 take corrective action.`,
3789
+ `2. exec_js: run JS in the current Chrome tab \u2014 NO Screen Recording needed.`,
3790
+ ` MEDIA CONTROL \u2192 always use exec_js, never hotkey (hotkeys go to Terminal not Chrome):`,
3791
+ ` pause: {action:"exec_js",js:"document.querySelector('video').pause()"}`,
3792
+ ` play: {action:"exec_js",js:"document.querySelector('video').play()"}`,
3793
+ ` check: {action:"exec_js",js:"document.querySelector('video').paused+' t='+document.querySelector('video').currentTime"}`,
3794
+ ` click: {action:"exec_js",js:"document.querySelector('.some-selector').click()"}`,
3795
+ `3. hotkey with app param: {action:"hotkey",keys:"k",app:"Google Chrome"} focuses Chrome first,`,
3796
+ ` then sends the key via AppleScript (reliable). Without app param, key goes to Terminal.`,
3797
+ `4. browser_state: quickly verify current tab URL + title after any navigation.`,
3798
+ `5. NEVER claim success based on action alone. exec_js to verify: video.paused, page title, etc.`,
3799
+ `6. computer_use: for multi-step desktop tasks \u2014 {task:"full goal description"}. No confirmation.`
3791
3800
  );
3792
3801
  }
3793
3802
  if (isSelfMod && this.agentRoot) {
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "0agent",
3
- "version": "1.0.65",
3
+ "version": "1.0.67",
4
4
  "description": "A persistent, learning AI agent that runs on your machine. An agent that learns.",
5
5
  "private": false,
6
6
  "license": "Apache-2.0",