npm - assistme - Versions diffs - 0.8.10 → 0.8.11 - Mend

assistme 0.8.10 → 0.8.11

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (21)

package/dist/{chunk-HY3FFXSQ.js → chunk-BGMIIZLF.js} +2 -2
package/dist/{chunk-T3DBLWUW.js → chunk-RJBLIGFJ.js} +65 -4
package/dist/{chunk-QGH5MFJA.js → chunk-RUP2IQG3.js} +19 -3
package/dist/{config-2HH7PO34.js → config-V2EJC3EH.js} +1 -1
package/dist/index.js +10 -12
package/dist/job-runner-OT3HZQEF.js +7 -0
package/dist/workers/entry.js +77 -14
package/package.json +1 -1
package/src/agent/event-hooks.ts +15 -2
package/src/agent/job-runner.ts +14 -3
package/src/agent/system-prompt.ts +22 -0
package/src/browser/controller.ts +73 -3
package/src/db/types.ts +1 -0
package/src/mcp/agent-tools-server.ts +31 -8
package/src/orchestrator.ts +7 -6
package/src/utils/config.ts +2 -2
package/src/utils/schemas.ts +2 -0
package/tests/agent/event-hooks.test.ts +1 -0
package/tests/agent/processor.test.ts +11 -0
package/tests/utils/config.test.ts +1 -1
package/dist/job-runner-IBVUDW6A.js +0 -7

package/dist/{chunk-HY3FFXSQ.js → chunk-BGMIIZLF.js} RENAMED Viewed

@@ -30,7 +30,7 @@ var CONFIG_DEFAULTS = {
   supabaseAnonKey: SUPABASE_ANON_KEY_DEFAULT,
   sessionName: "Default",
   model: "claude-sonnet-4-20250514",
-  taskTimeoutMinutes: 10
+  taskTimeoutMinutes: 0
 };
 var config = new Conf({
   projectName: "assistme",
@@ -48,7 +48,7 @@ function getConfig() {
     workspacePath: resolve(workspacePath),
     sessionName: config.get("sessionName") || "Default",
     model: config.get("model") || "claude-sonnet-4-20250514",
-    taskTimeoutMinutes: config.get("taskTimeoutMinutes") || 10
+    taskTimeoutMinutes: config.get("taskTimeoutMinutes") ?? 0
   };
 }
 function setConfig(key, value) {

package/dist/{chunk-T3DBLWUW.js → chunk-RJBLIGFJ.js} RENAMED Viewed

@@ -17,13 +17,13 @@ import {
   readAuthStore,
   safeParse,
   writeAuthStore
-} from "./chunk-QGH5MFJA.js";
+} from "./chunk-RUP2IQG3.js";
 import {
   AppError,
   errorMessage,
   getConfig,
   getDataDir
-} from "./chunk-HY3FFXSQ.js";
+} from "./chunk-BGMIIZLF.js";
 // src/db/auth.ts
 async function loginWithToken(mcpToken) {
@@ -53,7 +53,7 @@ async function logout() {
 // src/db/session.ts
 async function createSession(sessionName, workspacePath, version) {
-  const { getConfig: getConfig2 } = await import("./config-2HH7PO34.js");
+  const { getConfig: getConfig2 } = await import("./config-V2EJC3EH.js");
   const data = await callMcpHandler("session.create", {
     session_name: sessionName,
     workspace_path: workspacePath,
@@ -386,6 +386,8 @@ var BrowserController = class {
   // ── Navigation ──────────────────────────────────────────────────
   async navigate(url) {
     this.ensureConnected();
+    this.refCache.clear();
+    this.frameContexts.clear();
     await this.send("Page.navigate", { url });
     await this.waitForLoad();
     const info = await this.getPageInfo();
@@ -394,6 +396,8 @@ URL: ${info.url}`;
   }
   async goBack() {
     this.ensureConnected();
+    this.refCache.clear();
+    this.frameContexts.clear();
     try {
       const history = await this.send("Page.getNavigationHistory");
       const idx = history.currentIndex ?? 0;
@@ -414,6 +418,8 @@ URL: ${info.url}`;
   }
   async reload() {
     this.ensureConnected();
+    this.refCache.clear();
+    this.frameContexts.clear();
     await this.send("Page.reload");
     await this.waitForLoad();
     return "Page reloaded.";
@@ -1332,6 +1338,47 @@ Refs:
       return null;
     }
   }
+  // ── Overlay Dismissal ────────────────────────────────────────────
+  /**
+   * Attempt to dismiss popups/overlays blocking interaction.
+   * Tries Escape key first, then common close button patterns.
+   * Called automatically when clickRef detects an element is covered.
+   */
+  async tryDismissOverlay() {
+    try {
+      await this.pressKey("Escape");
+      await new Promise((r) => setTimeout(r, 300));
+      await this.send("Runtime.evaluate", {
+        expression: `
+          (function() {
+            var selectors = [
+              'button[aria-label="Close"]', 'button[aria-label="close"]',
+              'button[aria-label="Dismiss"]', 'button[aria-label="dismiss"]',
+              '[role="dialog"] button[aria-label*="close" i]',
+              '[role="dialog"] button[aria-label*="dismiss" i]',
+              '[data-dismiss]', '[data-close]',
+              '.modal-close', '[class*="close-button"]',
+              '[class*="CloseButton"]', '[class*="dismiss"]',
+            ];
+            for (var i = 0; i < selectors.length; i++) {
+              try {
+                var btn = document.querySelector(selectors[i]);
+                if (btn && btn.offsetParent !== null) {
+                  btn.click();
+                  return 'clicked';
+                }
+              } catch(e) {}
+            }
+            return 'none';
+          })()
+        `,
+        returnByValue: true
+      });
+      return true;
+    } catch {
+      return false;
+    }
+  }
   // ── Ref-based Interactions (CDP Input Events) ─────────────────────
   /**
    * Click an element by ref using CDP Input.dispatchMouseEvent.
@@ -1342,6 +1389,8 @@ Refs:
    * Includes auto-wait: retries up to 3 times (with 500ms intervals) if the
    * element is not yet actionable (e.g., covered by a loading overlay, still
    * animating into view). This matches Playwright's auto-waiting behavior.
+   * When an element is covered by an overlay, auto-dismiss is attempted
+   * (Escape key + common close buttons) before retrying.
    */
   async clickRef(refId) {
     this.ensureConnected();
@@ -1359,6 +1408,11 @@ Refs:
       }
       if (resolved.error) {
         lastError = resolved.error;
+        if (resolved.error.includes("Element is covered by") && attempt < maxRetries - 1) {
+          await this.tryDismissOverlay();
+          await new Promise((r) => setTimeout(r, 500));
+          continue;
+        }
         if (attempt < maxRetries - 1) {
           await new Promise((r) => setTimeout(r, 500));
           continue;
@@ -1542,7 +1596,14 @@ Refs:
         result,
         success
       });
-      if (!success) break;
+      if (!success) {
+        results.push({
+          action: "hint",
+          result: "Refs may be stale after failure. Use browser_snapshot to get fresh refs before retrying.",
+          success: true
+        });
+        break;
+      }
       if (spec.action !== "wait") {
         await new Promise((r) => setTimeout(r, 200));
       }

package/dist/{chunk-QGH5MFJA.js → chunk-RUP2IQG3.js} RENAMED Viewed

@@ -2,7 +2,7 @@ import {
   errorMessage,
   getConfig,
   getDataDir
-} from "./chunk-HY3FFXSQ.js";
+} from "./chunk-BGMIIZLF.js";
 // src/db/auth-store.ts
 import { existsSync, readFileSync, writeFileSync } from "fs";
@@ -240,6 +240,7 @@ var JobRowSchema = z.object({
   job_id: z.string(),
   job_name: z.string(),
   job_description: z.string().optional().default(""),
+  job_prompt: z.string().optional().nullable(),
   skill_id: z.string().optional().nullable(),
   skill_name: z.string().optional().nullable(),
   skill_description: z.string().optional().default(""),
@@ -250,6 +251,7 @@ var JobListRowSchema = z.object({
   id: z.string(),
   name: z.string(),
   description: z.string().optional().default(""),
+  prompt: z.string().optional().nullable(),
   skill_count: z.number().optional().default(0)
 });
 var JobRunRowSchema = z.object({
@@ -373,6 +375,7 @@ var JobRunner = class {
         jobId: first.job_id,
         jobName: first.job_name,
         jobDescription: first.job_description,
+        jobPrompt: first.job_prompt ?? null,
         skills: rows.filter((row) => row.skill_id).map((row) => ({
           skillId: row.skill_id,
           skillName: row.skill_name || "",
@@ -469,7 +472,12 @@ var JobRunner = class {
     prompt += `**Name:** ${job.jobName}
 `;
     prompt += `**Description:** ${job.jobDescription}
+`;
+    if (job.jobPrompt) {
+      prompt += `**Current Execution Prompt:** ${job.jobPrompt}
+`;
+    }
+    prompt += `
 `;
     if (job.skills.length > 0) {
       prompt += `**Current Skills:**
@@ -510,9 +518,10 @@ var JobRunner = class {
    * chain them based on what it discovers at runtime.
    */
   buildJobPrompt(job, runId) {
+    const effectiveDescription = job.jobPrompt || job.jobDescription;
     let prompt = `## Job: ${job.jobName}
 `;
-    prompt += `*${job.jobDescription}*
+    prompt += `*${effectiveDescription}*
 `;
     prompt += `**Run ID:** ${runId}
@@ -536,12 +545,17 @@ var JobRunner = class {
     }
     prompt += `
 ### How to Work
+`;
+    prompt += `- **Plan first**: Before jumping into actions, briefly plan your approach \u2014 which sites/tools to use, in what order, and how to verify results.
 `;
     prompt += `- **Be agentic**: Decide what to do based on what you discover. `;
     prompt += `If checking Slack reveals a request that requires GitHub work, go do the GitHub work immediately \u2014 don't just note it for later.
 `;
     prompt += `- **Chain dynamically**: One skill's output should inform your next action. `;
     prompt += `For example, if you find an assigned GitHub issue, use your coding skills to implement it.
+`;
+    prompt += `- **Use separate tabs for different sites**: When working across multiple websites, open each in its own tab (browser_new_tab). `;
+    prompt += `This preserves page state and avoids re-navigation. Use browser_switch_tab to move between them.
 `;
     prompt += `- **Skip what's irrelevant**: If a capability doesn't apply right now, skip it.
 `;
@@ -550,6 +564,8 @@ var JobRunner = class {
 `;
     prompt += `- **Respond and act**: If you find messages or issues that need replies, reply to them. `;
     prompt += `If you find code tasks, implement them.
+`;
+    prompt += `- **Handle auth walls**: If a site requires login, use browser_request_user_action immediately \u2014 do not waste attempts trying to bypass auth walls.
 `;
     prompt += `When finished, provide a summary of what you accomplished and any items that need the user's attention.

package/dist/{config-2HH7PO34.js → config-V2EJC3EH.js} RENAMED Viewed

@@ -7,7 +7,7 @@ import {
   getDataDir,
   resetDirCaches,
   setConfig
-} from "./chunk-HY3FFXSQ.js";
+} from "./chunk-BGMIIZLF.js";
 export {
   assertWithinAssistMeRoot,
   clearConfig,

package/dist/index.js CHANGED Viewed

@@ -27,7 +27,7 @@ import {
   setSessionBusy,
   toggleScheduledTask,
   updateHeartbeat
-} from "./chunk-T3DBLWUW.js";
+} from "./chunk-RJBLIGFJ.js";
 import {
   HEARTBEAT_INTERVAL_MS,
   HEARTBEAT_LOG_MAX_ENTRIES,
@@ -39,7 +39,7 @@ import {
   setLogConversationId,
   setLogHook,
   setLogLevel
-} from "./chunk-QGH5MFJA.js";
+} from "./chunk-RUP2IQG3.js";
 import {
   clearConfig,
   errorMessage,
@@ -47,7 +47,7 @@ import {
   getConfigPath,
   getDataDir,
   setConfig
-} from "./chunk-HY3FFXSQ.js";
+} from "./chunk-BGMIIZLF.js";
 // src/index.ts
 import { Command } from "commander";
@@ -1500,12 +1500,10 @@ var Orchestrator = class {
       await this.dispatchAndWait(`[JobRun: ${jobRun.job_name}] ${prompt}`);
       await runner.completeRun(jobRun.id, "completed", "Job executed via web trigger");
     } catch (err) {
-      log.error(`Job run failed: ${err}`);
-      await runner.completeRun(
-        jobRun.id,
-        "failed",
-        `Execution error: ${err instanceof Error ? err.message : err}`
-      ).catch((e) => log.error(`Failed to mark run as failed: ${e}`));
+      const errMsg = err instanceof Error ? err.message : String(err);
+      log.error(`Job run failed: ${errMsg}`);
+      const summary = errMsg.includes("cancelled") ? `Cancelled by user. Check workspace for any partial results.` : `Execution error: ${errMsg}`;
+      await runner.completeRun(jobRun.id, "failed", summary).catch((e) => log.error(`Failed to mark run as failed: ${e}`));
     }
   }
   // ── Busy State ──────────────────────────────────────────────────
@@ -2237,7 +2235,7 @@ function registerJobCommands(program2) {
   jobCmd.command("list").description("List your defined jobs").action(async () => {
     try {
       await getCurrentUserId();
-      const { JobRunner: JobRunner2 } = await import("./job-runner-IBVUDW6A.js");
+      const { JobRunner: JobRunner2 } = await import("./job-runner-OT3HZQEF.js");
       const runner = new JobRunner2();
       const jobs = await runner.listJobs();
       if (jobs.length === 0) {
@@ -2261,7 +2259,7 @@ function registerJobCommands(program2) {
   jobCmd.command("status [name]").description("Show run history for a job (or all jobs)").option("-l, --limit <number>", "Max runs to show (default: 5)").action(async (name, opts) => {
     try {
       await getCurrentUserId();
-      const { JobRunner: JobRunner2 } = await import("./job-runner-IBVUDW6A.js");
+      const { JobRunner: JobRunner2 } = await import("./job-runner-OT3HZQEF.js");
       const runner = new JobRunner2();
       const runs = await runner.getRunHistory(name, parseInt(opts.limit || "5"));
       if (runs.length === 0) {
@@ -2300,7 +2298,7 @@ Job Run History${name ? ` \u2014 ${name}` : ""}:`));
         process.exit(1);
       }
       await getCurrentUserId();
-      const { JobRunner: JobRunner2 } = await import("./job-runner-IBVUDW6A.js");
+      const { JobRunner: JobRunner2 } = await import("./job-runner-OT3HZQEF.js");
       const runner = new JobRunner2();
       const job = await runner.loadJob(name);
       if (!job) {

package/dist/job-runner-OT3HZQEF.js ADDED Viewed

@@ -0,0 +1,7 @@
+import {
+  JobRunner
+} from "./chunk-RUP2IQG3.js";
+import "./chunk-BGMIIZLF.js";
+export {
+  JobRunner
+};

package/dist/workers/entry.js CHANGED Viewed

@@ -20,7 +20,7 @@ import {
   resetEventSequence,
   setActionRequest,
   upsertAgentSkill
-} from "../chunk-T3DBLWUW.js";
+} from "../chunk-RJBLIGFJ.js";
 import {
   EDSGER_PRODUCT_SLUG,
   JobRunner,
@@ -47,14 +47,14 @@ import {
   safeParse,
   setCorrelationId,
   setLogTransport
-} from "../chunk-QGH5MFJA.js";
+} from "../chunk-RUP2IQG3.js";
 import {
   AppError,
   assertWithinAssistMeRoot,
   errorMessage,
   getAssistMeRoot,
   getConfig
-} from "../chunk-HY3FFXSQ.js";
+} from "../chunk-BGMIIZLF.js";
 // src/workers/conversation.ts
 import { config as loadEnv } from "dotenv";
@@ -1708,7 +1708,9 @@ function createAgentToolsServer(deps) {
         {
           name: z2.string().describe("Skill name in kebab-case, e.g. 'flight-booking'"),
           description: z2.string().describe("One-line description of what this skill does"),
-          instructions: z2.string().describe("Markdown step-by-step instructions"),
+          instructions: z2.string().describe(
+            "Markdown step-by-step instructions. IMPORTANT: When a skill produces document output (reports, summaries, etc.), instruct it to generate .docx/.xlsx/.pptx files (not .md), so end users can open and edit them."
+          ),
           emoji: z2.string().optional().describe("Single emoji representing this skill")
         },
         async (args) => {
@@ -1984,14 +1986,38 @@ Use \`ask_user\` to request these from the user, or create them yourself (e.g. r
 `;
           }
-          response += `**Your task:** Analyze this job description and decompose it into 4-10 automatable skills.
+          response += `**Your task:** Analyze this job description and do TWO things:
+`;
+          response += `- **A. Rewrite the description into a professional, structured prompt** that clearly defines the job's objectives, scope, and expected outcomes. This will be used as the actual execution prompt when running the job. Store it as the \`prompt\` parameter when calling \`skill_link_job\`.
+`;
+          response += `- **B. Decompose the job into 4-10 automatable skills.**
 `;
-          response += `**IMPORTANT \u2014 You MUST use ask_user before creating skills:**
+          response += `**Example \u2014 Task A (professional prompt rewrite):**
+`;
+          response += `> User description: "\u6211\u662F\u7535\u5546\u8FD0\u8425\uFF0C\u6BCF\u5929\u770B\u7ADE\u54C1\u4EF7\u683C\u3001\u5199\u6587\u6848\u3001\u56DE\u590D\u8BC4\u8BBA"
+`;
+          response += `> Professional prompt:
 `;
-          response += `1. Analyze the job and draft a list of proposed skills (name, emoji, one-line description for each).
+          response += `> \u4F5C\u4E3A\u7535\u5546\u8FD0\u8425\u4E13\u5458\uFF0C\u7CFB\u7EDF\u6027\u5730\u6267\u884C\u4EE5\u4E0B\u6838\u5FC3\u65E5\u5E38\u804C\u8D23\uFF1A
 `;
-          response += `2. Call \`ask_user\` with the formatted skill list as "question" and these options:
+          response += `> 1. \u7ADE\u54C1\u4EF7\u683C\u76D1\u63A7 \u2014 \u91C7\u96C6\u4E3B\u8981\u7ADE\u54C1\u5728\u5404\u7535\u5546\u5E73\u53F0\u7684\u5B9E\u65F6\u4EF7\u683C\uFF0C\u8BC6\u522B\u4EF7\u683C\u53D8\u52A8\u8D8B\u52BF\uFF0C\u751F\u6210\u5BF9\u6BD4\u62A5\u544A\uFF08.docx\uFF09
+`;
+          response += `> 2. \u5546\u54C1\u6587\u6848\u64B0\u5199 \u2014 \u6839\u636E\u4EA7\u54C1\u5356\u70B9\u3001\u76EE\u6807\u53D7\u4F17\u548C\u5E73\u53F0\u8C03\u6027\uFF0C\u64B0\u5199\u7B26\u5408 SEO \u89C4\u8303\u7684\u5546\u54C1\u6807\u9898\u4E0E\u63CF\u8FF0
+`;
+          response += `> 3. \u5BA2\u6237\u8BC4\u8BBA\u7BA1\u7406 \u2014 \u68C0\u67E5\u65B0\u589E\u5DEE\u8BC4\u4E0E\u54A8\u8BE2\uFF0C\u6309\u4F18\u5148\u7EA7\u5206\u7C7B\uFF0C\u8D77\u8349\u4E13\u4E1A\u56DE\u590D
+`;
+          response += `> \u5B8C\u6210\u540E\u6C47\u603B\u5F53\u65E5\u5DE5\u4F5C\u6458\u8981\uFF0C\u6807\u6CE8\u9700\u8981\u4EBA\u5DE5\u5173\u6CE8\u7684\u4E8B\u9879\u3002
+`;
+          response += `The prompt should be in the same language as the user's description. Keep it under 2000 characters.
+`;
+          response += `**Workflow (follow these steps in order):**
+`;
+          response += `1. Draft the professional prompt (task A) AND a list of proposed skills with name, emoji, one-line description each (task B).
+`;
+          response += `2. Call \`ask_user\` with both the rewritten prompt and the skill list as "question", and these options:
 `;
           response += `   - options: [{label: "Approve All", action_key: "approve_all", description: "Create all proposed skills"}, {label: "Cancel", action_key: "cancel", description: "Do not create any skills"}]
 `;
@@ -2014,7 +2040,7 @@ Use \`ask_user\` to request these from the user, or create them yourself (e.g. r
           response += `skill_create automatically adds the skill to the user's collection \u2014 no need to call skill_add.
 `;
-          response += `After ALL skills are created, call \`skill_link_job\` with job_name="${args.job_name}" and the list of created skill names to link them and mark the job as analyzed.
+          response += `After ALL skills are created, call \`skill_link_job\` with job_name="${args.job_name}", the list of created skill names, AND the professional prompt you drafted to link them and mark the job as analyzed.
 `;
           response += `**Guidelines for skill instructions:**
@@ -2028,6 +2054,8 @@ Use \`ask_user\` to request these from the user, or create them yourself (e.g. r
           response += `- Use placeholders like {query}, {date} for variable inputs
 `;
           response += `- Each skill should be a single, well-defined workflow (10-25 steps)
+`;
+          response += `- When a skill produces document output (reports, summaries, data exports), instruct it to generate .docx/.xlsx/.pptx files \u2014 NOT .md \u2014 so end users can open and edit them
 `;
           return { content: [{ type: "text", text: response }] };
         }
@@ -2038,11 +2066,14 @@ Use \`ask_user\` to request these from the user, or create them yourself (e.g. r
         {
           job_name: z2.string().describe("Name of the job to link skills to"),
           job_description: z2.string().describe("Job description (used if job doesn't exist yet)"),
-          skill_names: z2.array(z2.string()).describe("Names of skills to link to this job")
+          skill_names: z2.array(z2.string()).describe("Names of skills to link to this job"),
+          prompt: z2.string().optional().describe(
+            "Professional, structured rewrite of the job description (max 2000 chars). This becomes the actual execution prompt when running the job. Should clearly define objectives, scope, and expected outcomes."
+          )
         },
         async (args) => {
           try {
-            await saveJobToDb(args.job_name, args.job_description, args.skill_names);
+            await saveJobToDb(args.job_name, args.job_description, args.skill_names, args.prompt);
             log.success(
               `Job "${args.job_name}": linked ${args.skill_names.length} skills and marked as analyzed`
             );
@@ -2851,12 +2882,13 @@ ${message}`
     ]
   });
 }
-async function saveJobToDb(jobName, jobDescription, createdSkillNames) {
+async function saveJobToDb(jobName, jobDescription, createdSkillNames, prompt) {
   try {
     const data = await callMcpHandler("job.save_with_skills", {
       job_name: jobName,
       job_description: jobDescription,
-      skill_names: createdSkillNames
+      skill_names: createdSkillNames,
+      prompt: prompt || null
     });
     log.debug(
       `Job "${jobName}" saved via edge function (id: ${data}), ${createdSkillNames.length} skill(s) linked`
@@ -2921,12 +2953,21 @@ function createEventHooks(taskId, toolCallRecords, toolFailures = []) {
       error: errorStr.slice(0, 500),
       timestamp: Date.now()
     });
+    const sameToolFailures = toolFailures.filter((f) => f.toolName === displayName).length;
+    const isBrowser = displayName.startsWith("browser_");
+    const browserFailures = isBrowser ? toolFailures.filter((f) => f.toolName.startsWith("browser_")).length : 0;
     await emitEvent(taskId, "tool_failure", {
       name: displayName,
       error: errorStr.slice(0, 500),
-      failure_count: toolFailures.filter((f) => f.toolName === displayName).length
+      failure_count: sameToolFailures,
+      browser_failure_count: browserFailures
     });
     log.warn(`Tool failure tracked: ${displayName} (total: ${toolFailures.length})`);
+    if (isBrowser && browserFailures >= 3 && browserFailures % 3 === 0) {
+      await emitEvent(taskId, "tool_failure_hint", {
+        message: `${browserFailures} browser tool failures detected. Consider: (1) re-snapshot to get fresh refs, (2) use separate tabs for different sites, (3) navigate directly to target URLs to bypass popups, (4) use browser_request_user_action for login walls.`
+      });
+    }
     return {};
   };
   return {
@@ -3124,6 +3165,13 @@ Workflow for web tasks (e.g. "\u67E5\u4E00\u4E0B kindle \u6700\u65B0\u6B3E\u4EF7
 6. Repeat 4-5 as needed (re-snapshot after navigation or major page changes)
 7. Summarize findings
+Workflow for MULTI-SITE tasks (e.g. "\u5728 Seek \u627E\u5DE5\u4F5C\uFF0C\u7136\u540E\u53BB Immigration NZ \u9A8C\u8BC1\u96C7\u4E3B"):
+- ALWAYS use separate tabs for different websites. Do NOT navigate back and forth in one tab \u2014 you lose page state.
+- Open each site in its own tab: browser_new_tab \u2192 browser_navigate
+- Use browser_switch_tab to switch between sites
+- This preserves scroll position, form data, and search results on each site
+- Example: Tab 0 = Seek (job search), Tab 1 = Immigration NZ (employer check), Tab 2 = LinkedIn (research)
 Workflow for form filling (e.g. "\u6CE8\u518C\u4E00\u4E2A Gmail \u8D26\u53F7"):
 1. browser_connect + browser_navigate \u2192 go to the form page
 2. browser_snapshot \u2192 see all form fields with ref numbers
@@ -3140,6 +3188,21 @@ Workflow for form filling (e.g. "\u6CE8\u518C\u4E00\u4E2A Gmail \u8D26\u53F7"):
    - Browser approach too slow \u2192 consider building a script/CLI solution
    - One data source fails \u2192 try an alternative source
    - If stuck after 2 failed attempts at the same step, try a fundamentally different approach
+   - **Popup/overlay blocks interaction** \u2192 The system auto-tries Escape + close buttons. If that fails, navigate directly to the target URL (e.g. append search params to skip the homepage popup). Do NOT repeatedly try to click through the same overlay.
+   - **Login/auth wall** \u2192 Use browser_request_user_action to ask the user to log in. Use memory_store to remember which sites require login so you can warn the user upfront next time.
+   - **Stale refs after navigation** \u2192 Refs are automatically cleared on navigation. Always re-snapshot after browser_navigate, goBack, or reload. If browser_act returns a "hint" about stale refs, re-snapshot immediately.
+10. DOCUMENT OUTPUT FORMAT:
+   - When creating documents, reports, or deliverables for the user, ALWAYS prefer Microsoft Office formats (.docx for text documents, .xlsx for spreadsheets, .pptx for presentations) over Markdown (.md).
+   - Regular users need to open, read, and edit these files \u2014 Office formats are universally accessible.
+   - Use the Bash tool to install and run document-generation libraries as needed:
+     * Python: python-docx (Word), openpyxl (Excel), python-pptx (PowerPoint)
+     * Node.js: docx (Word), exceljs (Excel), pptx (PowerPoint)
+   - Only use Markdown when:
+     * The output is internal (e.g. README.md in a program directory, skill instructions)
+     * The user explicitly requests Markdown
+     * The content is a quick inline response in the conversation (not a standalone file)
+   - When writing .docx files, include proper formatting: headings, paragraphs, tables, bullet lists \u2014 not just plain text dumped into a Word file.
 Guidelines:
 - SELF-VERIFY before finishing: re-read modified files, take a final screenshot after browser actions, or re-check output to confirm correctness. Never assume success without confirming the end state.

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "assistme",
-  "version": "0.8.10",
+  "version": "0.8.11",
   "description": "AssistMe CLI Agent - AI-powered agentic assistant for code, browser, and automation",
   "type": "module",
   "main": "dist/index.js",

package/src/agent/event-hooks.ts CHANGED Viewed

@@ -34,7 +34,6 @@ export function stripMcpPrefix(toolName: string): string {
   return match ? match[1] : toolName;
 }
 /**
  * Create PreToolUse and PostToolUse hooks that emit events to Supabase.
  * These hooks let the web UI display tool activity in real-time.
@@ -113,14 +112,28 @@ export function createEventHooks(
       timestamp: Date.now(),
     });
+    const sameToolFailures = toolFailures.filter((f) => f.toolName === displayName).length;
+    const isBrowser = displayName.startsWith("browser_");
+    const browserFailures = isBrowser
+      ? toolFailures.filter((f) => f.toolName.startsWith("browser_")).length
+      : 0;
     await emitEvent(taskId, "tool_failure", {
       name: displayName,
       error: errorStr.slice(0, 500),
-      failure_count: toolFailures.filter((f) => f.toolName === displayName).length,
+      failure_count: sameToolFailures,
+      browser_failure_count: browserFailures,
     });
     log.warn(`Tool failure tracked: ${displayName} (total: ${toolFailures.length})`);
+    // Emit strategy hint when browser failures accumulate
+    if (isBrowser && browserFailures >= 3 && browserFailures % 3 === 0) {
+      await emitEvent(taskId, "tool_failure_hint", {
+        message: `${browserFailures} browser tool failures detected. Consider: (1) re-snapshot to get fresh refs, (2) use separate tabs for different sites, (3) navigate directly to target URLs to bypass popups, (4) use browser_request_user_action for login walls.`,
+      });
+    }
     return {};
   };

package/src/agent/job-runner.ts CHANGED Viewed

@@ -18,6 +18,7 @@ export interface JobInfo {
   jobId: string;
   jobName: string;
   jobDescription: string;
+  jobPrompt: string | null;
   skills: JobSkillInfo[];
 }
@@ -57,6 +58,7 @@ export class JobRunner {
         jobId: first.job_id,
         jobName: first.job_name,
         jobDescription: first.job_description,
+        jobPrompt: first.job_prompt ?? null,
         skills: rows
           .filter((row) => row!.skill_id)
           .map((row) => ({
@@ -172,7 +174,11 @@ export class JobRunner {
     let prompt = `Analyze this job definition and determine what skills are needed to execute it effectively.\n\n`;
     prompt += `## Job Definition\n`;
     prompt += `**Name:** ${job.jobName}\n`;
-    prompt += `**Description:** ${job.jobDescription}\n\n`;
+    prompt += `**Description:** ${job.jobDescription}\n`;
+    if (job.jobPrompt) {
+      prompt += `**Current Execution Prompt:** ${job.jobPrompt}\n`;
+    }
+    prompt += `\n`;
     if (job.skills.length > 0) {
       prompt += `**Current Skills:**\n`;
@@ -204,8 +210,9 @@ export class JobRunner {
    * chain them based on what it discovers at runtime.
    */
   buildJobPrompt(job: JobInfo, runId: string): string {
+    const effectiveDescription = job.jobPrompt || job.jobDescription;
     let prompt = `## Job: ${job.jobName}\n`;
-    prompt += `*${job.jobDescription}*\n\n`;
+    prompt += `*${effectiveDescription}*\n\n`;
     prompt += `**Run ID:** ${runId}\n\n`;
     prompt += `You are now acting as "${job.jobName}". `;
@@ -222,15 +229,19 @@ export class JobRunner {
     }
     prompt += `\n### How to Work\n`;
+    prompt += `- **Plan first**: Before jumping into actions, briefly plan your approach — which sites/tools to use, in what order, and how to verify results.\n`;
     prompt += `- **Be agentic**: Decide what to do based on what you discover. `;
     prompt += `If checking Slack reveals a request that requires GitHub work, go do the GitHub work immediately — don't just note it for later.\n`;
     prompt += `- **Chain dynamically**: One skill's output should inform your next action. `;
     prompt += `For example, if you find an assigned GitHub issue, use your coding skills to implement it.\n`;
+    prompt += `- **Use separate tabs for different sites**: When working across multiple websites, open each in its own tab (browser_new_tab). `;
+    prompt += `This preserves page state and avoids re-navigation. Use browser_switch_tab to move between them.\n`;
     prompt += `- **Skip what's irrelevant**: If a capability doesn't apply right now, skip it.\n`;
     prompt += `- **Use tools directly too**: You also have browser, file, and shell tools. `;
     prompt += `Use them directly when a skill isn't needed — skills are guides, not mandatory steps.\n`;
     prompt += `- **Respond and act**: If you find messages or issues that need replies, reply to them. `;
-    prompt += `If you find code tasks, implement them.\n\n`;
+    prompt += `If you find code tasks, implement them.\n`;
+    prompt += `- **Handle auth walls**: If a site requires login, use browser_request_user_action immediately — do not waste attempts trying to bypass auth walls.\n\n`;
     prompt += `When finished, provide a summary of what you accomplished and any items that need the user's attention.\n`;

package/src/agent/system-prompt.ts CHANGED Viewed

@@ -147,6 +147,13 @@ Workflow for web tasks (e.g. "查一下 kindle 最新款价格"):
 6. Repeat 4-5 as needed (re-snapshot after navigation or major page changes)
 7. Summarize findings
+Workflow for MULTI-SITE tasks (e.g. "在 Seek 找工作，然后去 Immigration NZ 验证雇主"):
+- ALWAYS use separate tabs for different websites. Do NOT navigate back and forth in one tab — you lose page state.
+- Open each site in its own tab: browser_new_tab → browser_navigate
+- Use browser_switch_tab to switch between sites
+- This preserves scroll position, form data, and search results on each site
+- Example: Tab 0 = Seek (job search), Tab 1 = Immigration NZ (employer check), Tab 2 = LinkedIn (research)
 Workflow for form filling (e.g. "注册一个 Gmail 账号"):
 1. browser_connect + browser_navigate → go to the form page
 2. browser_snapshot → see all form fields with ref numbers
@@ -163,6 +170,21 @@ Workflow for form filling (e.g. "注册一个 Gmail 账号"):
    - Browser approach too slow → consider building a script/CLI solution
    - One data source fails → try an alternative source
    - If stuck after 2 failed attempts at the same step, try a fundamentally different approach
+   - **Popup/overlay blocks interaction** → The system auto-tries Escape + close buttons. If that fails, navigate directly to the target URL (e.g. append search params to skip the homepage popup). Do NOT repeatedly try to click through the same overlay.
+   - **Login/auth wall** → Use browser_request_user_action to ask the user to log in. Use memory_store to remember which sites require login so you can warn the user upfront next time.
+   - **Stale refs after navigation** → Refs are automatically cleared on navigation. Always re-snapshot after browser_navigate, goBack, or reload. If browser_act returns a "hint" about stale refs, re-snapshot immediately.
+10. DOCUMENT OUTPUT FORMAT:
+   - When creating documents, reports, or deliverables for the user, ALWAYS prefer Microsoft Office formats (.docx for text documents, .xlsx for spreadsheets, .pptx for presentations) over Markdown (.md).
+   - Regular users need to open, read, and edit these files — Office formats are universally accessible.
+   - Use the Bash tool to install and run document-generation libraries as needed:
+     * Python: python-docx (Word), openpyxl (Excel), python-pptx (PowerPoint)
+     * Node.js: docx (Word), exceljs (Excel), pptx (PowerPoint)
+   - Only use Markdown when:
+     * The output is internal (e.g. README.md in a program directory, skill instructions)
+     * The user explicitly requests Markdown
+     * The content is a quick inline response in the conversation (not a standalone file)
+   - When writing .docx files, include proper formatting: headings, paragraphs, tables, bullet lists — not just plain text dumped into a Word file.
 Guidelines:
 - SELF-VERIFY before finishing: re-read modified files, take a final screenshot after browser actions, or re-check output to confirm correctness. Never assume success without confirming the end state.

package/src/browser/controller.ts CHANGED Viewed

@@ -199,6 +199,9 @@ export class BrowserController {
   async navigate(url: string): Promise<string> {
     this.ensureConnected();
+    // Clear refs from previous page — they become stale after navigation
+    this.refCache.clear();
+    this.frameContexts.clear();
     await this.send("Page.navigate", { url });
     // Wait for load
     await this.waitForLoad();
@@ -208,6 +211,8 @@ export class BrowserController {
   async goBack(): Promise<string> {
     this.ensureConnected();
+    this.refCache.clear();
+    this.frameContexts.clear();
     try {
       // Get navigation history and go to the previous entry
       const history = (await this.send("Page.getNavigationHistory")) as {
@@ -235,6 +240,8 @@ export class BrowserController {
   async reload(): Promise<string> {
     this.ensureConnected();
+    this.refCache.clear();
+    this.frameContexts.clear();
     await this.send("Page.reload");
     await this.waitForLoad();
     return "Page reloaded.";
@@ -1278,6 +1285,52 @@ export class BrowserController {
     }
   }
+  // ── Overlay Dismissal ────────────────────────────────────────────
+  /**
+   * Attempt to dismiss popups/overlays blocking interaction.
+   * Tries Escape key first, then common close button patterns.
+   * Called automatically when clickRef detects an element is covered.
+   */
+  private async tryDismissOverlay(): Promise<boolean> {
+    try {
+      // Strategy 1: Press Escape to dismiss modals/popups
+      await this.pressKey("Escape");
+      await new Promise((r) => setTimeout(r, 300));
+      // Strategy 2: Click common close/dismiss buttons
+      await this.send("Runtime.evaluate", {
+        expression: `
+          (function() {
+            var selectors = [
+              'button[aria-label="Close"]', 'button[aria-label="close"]',
+              'button[aria-label="Dismiss"]', 'button[aria-label="dismiss"]',
+              '[role="dialog"] button[aria-label*="close" i]',
+              '[role="dialog"] button[aria-label*="dismiss" i]',
+              '[data-dismiss]', '[data-close]',
+              '.modal-close', '[class*="close-button"]',
+              '[class*="CloseButton"]', '[class*="dismiss"]',
+            ];
+            for (var i = 0; i < selectors.length; i++) {
+              try {
+                var btn = document.querySelector(selectors[i]);
+                if (btn && btn.offsetParent !== null) {
+                  btn.click();
+                  return 'clicked';
+                }
+              } catch(e) {}
+            }
+            return 'none';
+          })()
+        `,
+        returnByValue: true,
+      });
+      return true;
+    } catch {
+      return false;
+    }
+  }
   // ── Ref-based Interactions (CDP Input Events) ─────────────────────
   /**
@@ -1289,6 +1342,8 @@ export class BrowserController {
    * Includes auto-wait: retries up to 3 times (with 500ms intervals) if the
    * element is not yet actionable (e.g., covered by a loading overlay, still
    * animating into view). This matches Playwright's auto-waiting behavior.
+   * When an element is covered by an overlay, auto-dismiss is attempted
+   * (Escape key + common close buttons) before retrying.
    */
   async clickRef(refId: number): Promise<RefActionResult> {
     this.ensureConnected();
@@ -1311,7 +1366,13 @@ export class BrowserController {
       if (resolved.error) {
         lastError = resolved.error;
-        // If element is covered or hidden, wait and retry (it might be animating)
+        // If element is covered by an overlay, try auto-dismissing it before retry
+        if (resolved.error.includes("Element is covered by") && attempt < maxRetries - 1) {
+          await this.tryDismissOverlay();
+          await new Promise((r) => setTimeout(r, 500));
+          continue;
+        }
+        // If element is hidden or other issue, wait and retry (it might be animating)
         if (attempt < maxRetries - 1) {
           await new Promise((r) => setTimeout(r, 500));
           continue;
@@ -1528,8 +1589,17 @@ export class BrowserController {
         success,
       });
-      // If an action failed, stop the batch (remaining refs may be stale)
-      if (!success) break;
+      // If an action failed, stop the batch (remaining refs may be stale).
+      // Append re-snapshot hint to help the agent recover.
+      if (!success) {
+        results.push({
+          action: "hint",
+          result:
+            "Refs may be stale after failure. Use browser_snapshot to get fresh refs before retrying.",
+          success: true,
+        });
+        break;
+      }
       // Brief pause between actions for DOM to settle
       if (spec.action !== "wait") {

package/src/db/types.ts CHANGED Viewed

@@ -49,6 +49,7 @@ export type EventType =
   | "tool_use_input"
   | "tool_result"
   | "tool_failure"
+  | "tool_failure_hint"
   | "thinking"
   | "error"
   | "status_change"

package/src/mcp/agent-tools-server.ts CHANGED Viewed

@@ -92,7 +92,11 @@ export function createAgentToolsServer(deps: AgentToolsDeps): McpSdkServerConfig
         {
           name: z.string().describe("Skill name in kebab-case, e.g. 'flight-booking'"),
           description: z.string().describe("One-line description of what this skill does"),
-          instructions: z.string().describe("Markdown step-by-step instructions"),
+          instructions: z.string().describe(
+            "Markdown step-by-step instructions. " +
+            "IMPORTANT: When a skill produces document output (reports, summaries, etc.), " +
+            "instruct it to generate .docx/.xlsx/.pptx files (not .md), so end users can open and edit them."
+          ),
           emoji: z.string().optional().describe("Single emoji representing this skill"),
         },
         async (args) => {
@@ -400,10 +404,21 @@ export function createAgentToolsServer(deps: AgentToolsDeps): McpSdkServerConfig
             response += `**Existing skills (do NOT duplicate):** ${existingNames.join(", ")}\n\n`;
           }
-          response += `**Your task:** Analyze this job description and decompose it into 4-10 automatable skills.\n\n`;
-          response += `**IMPORTANT — You MUST use ask_user before creating skills:**\n`;
-          response += `1. Analyze the job and draft a list of proposed skills (name, emoji, one-line description for each).\n`;
-          response += `2. Call \`ask_user\` with the formatted skill list as "question" and these options:\n`;
+          response += `**Your task:** Analyze this job description and do TWO things:\n`;
+          response += `- **A. Rewrite the description into a professional, structured prompt** that clearly defines the job's objectives, scope, and expected outcomes. This will be used as the actual execution prompt when running the job. Store it as the \`prompt\` parameter when calling \`skill_link_job\`.\n`;
+          response += `- **B. Decompose the job into 4-10 automatable skills.**\n\n`;
+          response += `**Example — Task A (professional prompt rewrite):**\n`;
+          response += `> User description: "我是电商运营，每天看竞品价格、写文案、回复评论"\n`;
+          response += `> Professional prompt:\n`;
+          response += `> 作为电商运营专员，系统性地执行以下核心日常职责：\n`;
+          response += `> 1. 竞品价格监控 — 采集主要竞品在各电商平台的实时价格，识别价格变动趋势，生成对比报告（.docx）\n`;
+          response += `> 2. 商品文案撰写 — 根据产品卖点、目标受众和平台调性，撰写符合 SEO 规范的商品标题与描述\n`;
+          response += `> 3. 客户评论管理 — 检查新增差评与咨询，按优先级分类，起草专业回复\n`;
+          response += `> 完成后汇总当日工作摘要，标注需要人工关注的事项。\n\n`;
+          response += `The prompt should be in the same language as the user's description. Keep it under 2000 characters.\n\n`;
+          response += `**Workflow (follow these steps in order):**\n`;
+          response += `1. Draft the professional prompt (task A) AND a list of proposed skills with name, emoji, one-line description each (task B).\n`;
+          response += `2. Call \`ask_user\` with both the rewritten prompt and the skill list as "question", and these options:\n`;
           response += `   - options: [{label: "Approve All", action_key: "approve_all", description: "Create all proposed skills"}, {label: "Cancel", action_key: "cancel", description: "Do not create any skills"}]\n`;
           response += `3. WAIT for the response. If action_key is "approve_all", create all skills using \`skill_create\`. If "cancel", stop.\n`;
           response += `4. Do NOT ask for confirmation in text. Do NOT create skills without calling ask_user first.\n\n`;
@@ -413,13 +428,14 @@ export function createAgentToolsServer(deps: AgentToolsDeps): McpSdkServerConfig
           response += `- instructions: detailed step-by-step markdown instructions the agent can follow\n`;
           response += `- emoji: a single emoji representing the skill\n\n`;
           response += `skill_create automatically adds the skill to the user's collection — no need to call skill_add.\n\n`;
-          response += `After ALL skills are created, call \`skill_link_job\` with job_name="${args.job_name}" and the list of created skill names to link them and mark the job as analyzed.\n\n`;
+          response += `After ALL skills are created, call \`skill_link_job\` with job_name="${args.job_name}", the list of created skill names, AND the professional prompt you drafted to link them and mark the job as analyzed.\n\n`;
           response += `**Guidelines for skill instructions:**\n`;
           response += `- Write clear, actionable markdown steps\n`;
           response += `- Reference browser tools (browser_navigate, browser_click, browser_read_page, etc.) for web tasks\n`;
           response += `- Include error handling steps\n`;
           response += `- Use placeholders like {query}, {date} for variable inputs\n`;
           response += `- Each skill should be a single, well-defined workflow (10-25 steps)\n`;
+          response += `- When a skill produces document output (reports, summaries, data exports), instruct it to generate .docx/.xlsx/.pptx files — NOT .md — so end users can open and edit them\n`;
           return { content: [{ type: "text", text: response }] };
         }
@@ -431,10 +447,15 @@ export function createAgentToolsServer(deps: AgentToolsDeps): McpSdkServerConfig
           job_name: z.string().describe("Name of the job to link skills to"),
           job_description: z.string().describe("Job description (used if job doesn't exist yet)"),
           skill_names: z.array(z.string()).describe("Names of skills to link to this job"),
+          prompt: z.string().optional().describe(
+            "Professional, structured rewrite of the job description (max 2000 chars). " +
+            "This becomes the actual execution prompt when running the job. " +
+            "Should clearly define objectives, scope, and expected outcomes."
+          ),
         },
         async (args) => {
           try {
-            await saveJobToDb(args.job_name, args.job_description, args.skill_names);
+            await saveJobToDb(args.job_name, args.job_description, args.skill_names, args.prompt);
             log.success(
               `Job "${args.job_name}": linked ${args.skill_names.length} skills and marked as analyzed`
             );
@@ -1393,13 +1414,15 @@ export function createAgentToolsServer(deps: AgentToolsDeps): McpSdkServerConfig
 async function saveJobToDb(
   jobName: string,
   jobDescription: string,
-  createdSkillNames: string[]
+  createdSkillNames: string[],
+  prompt?: string
 ): Promise<void> {
   try {
     const data = await callMcpHandler("job.save_with_skills", {
       job_name: jobName,
       job_description: jobDescription,
       skill_names: createdSkillNames,
+      prompt: prompt || null,
     });
     log.debug(

package/src/orchestrator.ts CHANGED Viewed

@@ -226,13 +226,14 @@ export class Orchestrator {
       await this.dispatchAndWait(`[JobRun: ${jobRun.job_name}] ${prompt}`);
       await runner.completeRun(jobRun.id, "completed", "Job executed via web trigger");
     } catch (err) {
-      log.error(`Job run failed: ${err}`);
+      const errMsg = err instanceof Error ? err.message : String(err);
+      log.error(`Job run failed: ${errMsg}`);
+      // Preserve partial progress info in the summary
+      const summary = errMsg.includes("cancelled")
+        ? `Cancelled by user. Check workspace for any partial results.`
+        : `Execution error: ${errMsg}`;
       await runner
-        .completeRun(
-          jobRun.id,
-          "failed",
-          `Execution error: ${err instanceof Error ? err.message : err}`
-        )
+        .completeRun(jobRun.id, "failed", summary)
         .catch((e) => log.error(`Failed to mark run as failed: ${e}`));
     }
   }

package/src/utils/config.ts CHANGED Viewed

@@ -29,7 +29,7 @@ const CONFIG_DEFAULTS: Partial<AssistMeConfig> = {
   supabaseAnonKey: SUPABASE_ANON_KEY_DEFAULT,
   sessionName: "Default",
   model: "claude-sonnet-4-20250514",
-  taskTimeoutMinutes: 10,
+  taskTimeoutMinutes: 0,
 };
 const config = new Conf<Partial<AssistMeConfig>>({
@@ -51,7 +51,7 @@ export function getConfig(): AssistMeConfig {
     workspacePath: resolve(workspacePath),
     sessionName: config.get("sessionName") || "Default",
     model: config.get("model") || "claude-sonnet-4-20250514",
-    taskTimeoutMinutes: config.get("taskTimeoutMinutes") || 10,
+    taskTimeoutMinutes: config.get("taskTimeoutMinutes") ?? 0,
   };
 }

package/src/utils/schemas.ts CHANGED Viewed

@@ -53,6 +53,7 @@ export const JobRowSchema = z.object({
   job_id: z.string(),
   job_name: z.string(),
   job_description: z.string().optional().default(""),
+  job_prompt: z.string().optional().nullable(),
   skill_id: z.string().optional().nullable(),
   skill_name: z.string().optional().nullable(),
   skill_description: z.string().optional().default(""),
@@ -64,6 +65,7 @@ export const JobListRowSchema = z.object({
   id: z.string(),
   name: z.string(),
   description: z.string().optional().default(""),
+  prompt: z.string().optional().nullable(),
   skill_count: z.number().optional().default(0),
 });

package/tests/agent/event-hooks.test.ts CHANGED Viewed

@@ -206,6 +206,7 @@ describe("createEventHooks", () => {
         name: "Bash",
         error: "command not found: bad-cmd",
         failure_count: 1,
+        browser_failure_count: 0,
       });
     });

package/tests/agent/processor.test.ts CHANGED Viewed

@@ -39,6 +39,7 @@ vi.mock("../../src/utils/config.js", () => ({
     workspacePath: "/tmp/test-workspace",
     maxTurns: 10,
     anthropicApiKey: "sk-ant-test",
+    taskTimeoutMinutes: 0,
   }),
   getAssistMeRoot: () => "/tmp/test-workspace/assistme",
 }));
@@ -78,6 +79,7 @@ vi.mock("../../src/agent/memory.js", () => ({
   MemoryManager: class MockMemoryManager {
     buildMemoryPrompt = vi.fn().mockResolvedValue("");
     remember = mockRemember;
+    compressIfNeeded = vi.fn().mockResolvedValue(undefined);
   },
 }));
@@ -85,6 +87,7 @@ vi.mock("../../src/agent/skills.js", () => ({
   SkillManager: class MockSkillManager {
     setUserId = vi.fn();
     loadFromDb = vi.fn().mockResolvedValue(undefined);
+    ensureLoaded = vi.fn().mockResolvedValue(undefined);
     buildSkillPrompt = vi.fn().mockReturnValue("");
     buildSkillDescriptions = vi.fn().mockResolvedValue("");
     findRelevant = vi.fn().mockReturnValue([]);
@@ -136,6 +139,14 @@ vi.mock("../../src/agent/self-analyzer.js", () => ({
   analyzeSelfPostTask: vi.fn().mockResolvedValue(undefined),
 }));
+vi.mock("../../src/agent/prompt-builder.js", () => ({
+  buildSystemPrompt: vi.fn().mockResolvedValue("mock system prompt"),
+}));
+vi.mock("../../src/agent/skill-evaluator.js", () => ({
+  evaluateAndMaybeCreateSkill: vi.fn().mockResolvedValue(undefined),
+}));
 const { TaskProcessor } = await import("../../src/agent/processor.js");
 describe("TaskProcessor", () => {

package/tests/utils/config.test.ts CHANGED Viewed

@@ -50,7 +50,7 @@ describe("config module", () => {
     const config = getConfig();
     expect(config.sessionName).toBe("Default");
     expect(config.model).toBe("claude-sonnet-4-20250514");
-    expect(config.taskTimeoutMinutes).toBe(10);
+    expect(config.taskTimeoutMinutes).toBe(0);
   });
   it("resolves workspacePath to absolute path", () => {

package/dist/job-runner-IBVUDW6A.js DELETED Viewed

@@ -1,7 +0,0 @@
-import {
-  JobRunner
-} from "./chunk-QGH5MFJA.js";
-import "./chunk-HY3FFXSQ.js";
-export {
-  JobRunner
-};