0agent 1.0.64 → 1.0.66

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2)
  1. package/dist/daemon.mjs +16 -7
  2. package/package.json +1 -1
package/dist/daemon.mjs CHANGED
@@ -3371,8 +3371,9 @@ var init_CapabilityRegistry = __esm({
3371
3371
  active.add("scrape_url");
3372
3372
  active.add("browser_open");
3373
3373
  }
3374
- if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use/i.test(lower)) {
3374
+ if (/click|screenshot|ui|desktop|window|screen|gui|mouse|keyboard|open.*app|fill.*form|navigate.*browser|interact|automate|computer.*use|whatsapp|telegram|youtube|music|play|send.*message/i.test(lower)) {
3375
3375
  active.add("computer_use");
3376
+ active.add("gui_automation");
3376
3377
  }
3377
3378
  return [...this.capabilities.values()].filter((c) => active.has(c.name)).map((c) => c.toolDefinition);
3378
3379
  }
@@ -3782,12 +3783,20 @@ content = element.text if element else page.get_all_text()` : `content = page.ge
3782
3783
  if (hasGUI) {
3783
3784
  lines.push(
3784
3785
  ``,
3785
- `Computer use: use computer_use for any desktop/browser/keyboard/mouse task.`,
3786
- `Pass a plain-English task description \u2014 e.g. {task: "Open WhatsApp, search for Sahil Godara, send Hi"}.`,
3787
- `DO NOT split into separate tool calls \u2014 describe the full end-to-end goal in ONE computer_use call.`,
3788
- `DO NOT ask for confirmation before computer_use \u2014 execute immediately.`,
3789
- `For messaging apps (WhatsApp, Telegram, iMessage): use computer_use directly, no confirmation needed.`,
3790
- `After computer_use, verify success by calling it again with task="take a screenshot and describe what you see".`
3786
+ `GUI/Browser rules:`,
3787
+ `1. open_url now returns actual URL + title + video state \u2014 read this output to know what really loaded.`,
3788
+ ` If it says "Title: YouTube Music" (homepage) instead of the song, navigation failed \u2014 fix it.`,
3789
+ `2. exec_js: run JavaScript in the current Chrome tab WITHOUT Screen Recording permission.`,
3790
+ ` Use it to interact with pages: click buttons, fill inputs, read state.`,
3791
+ ` Examples: {action:"exec_js",js:"document.querySelector('video').paused"}`,
3792
+ ` {action:"exec_js",js:"document.querySelector('.ytmusic-play-button-renderer').click()"}`,
3793
+ `3. browser_state: get current tab URL + title quickly \u2014 call after any navigation to verify.`,
3794
+ `4. NEVER claim a task succeeded based on the action alone. Read the tool output and verify:`,
3795
+ ` - "PLAYING:1.4s \u2713" \u2192 video is playing`,
3796
+ ` - "PAUSED" \u2192 video is NOT playing, take corrective action`,
3797
+ ` - "Title: Search results" \u2192 you're on search page, not the song \u2014 fix it`,
3798
+ `5. computer_use: for multi-step desktop tasks \u2014 pass full goal as {task:"..."}.`,
3799
+ ` DO NOT ask for confirmation \u2014 execute immediately.`
3791
3800
  );
3792
3801
  }
3793
3802
  if (isSelfMod && this.agentRoot) {
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "0agent",
3
- "version": "1.0.64",
3
+ "version": "1.0.66",
4
4
  "description": "A persistent, learning AI agent that runs on your machine. An agent that learns.",
5
5
  "private": false,
6
6
  "license": "Apache-2.0",