npm - rl-simulator-core - Versions diffs - 1.0.8 → 1.2.0 - Mend

rl-simulator-core 1.0.8 → 1.2.0

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (7)

package/dist/index.d.mts CHANGED Viewed

@@ -1,6 +1,6 @@
+import { chromium } from 'playwright';
 import fs from 'fs';
 import path from 'path';
-import { chromium } from 'playwright';
 import { createOpenAI } from '@ai-sdk/openai';
 import { generateText } from 'ai';
 import dotenv from 'dotenv';
@@ -286,7 +286,7 @@ async function executeAction(page, action) {
     return 'CONTINUE';
 }
-async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo }) {
+async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo, browser: externalBrowser }) {
     console.log(`[Agent] Starting task: ${taskInput} on ${targetUrl} (Session: ${sessionId})`);
     const screenshotsDir = path.join(process.cwd(), 'screenshots');
@@ -295,11 +295,19 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.log(`📁 创建截图目录: ${screenshotsDir}`);
     }
-    // 2. Launch Browser
-    const browser = await chromium.launch({
-        headless: true, // Visible for demo/debug
-        args: ['--start-maximized'] // Attempt to maximize
-    });
+    // 2. Launch Browser (or use existing)
+    let browser;
+    let shouldCloseBrowser = false;
+    if (externalBrowser) {
+        browser = externalBrowser;
+    } else {
+        browser = await chromium.launch({
+            headless: true, // Visible for demo/debug
+            args: ['--start-maximized'] // Attempt to maximize
+        });
+        shouldCloseBrowser = true;
+    }
     const context = await browser.newContext({
         viewport: { width: 430, height: 800 } // Set a reasonable fixed viewport
@@ -366,7 +374,33 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
             // 3. Query AI
             console.log("Querying AI...");
-            const aiContent = await queryAI(conversationHistory);
+            // Optimization: Window mode & Filter images
+            // 1. Keep last 20 rounds (40 messages) - Better memory than 3 rounds, but prevents infinite growth
+            let optimizedHistory = conversationHistory;
+            if (conversationHistory.length > 40) {
+                optimizedHistory = conversationHistory.slice(-40);
+            }
+            // 2. Filter images from older messages (Keep images only in the last 3 rounds / 6 messages)
+            // Strategy: "Fading Memory" - Recent = Full (Text+Img), Older = Text only
+            optimizedHistory = optimizedHistory.map((msg, index) => {
+                // Determine if this message is within the "recent 3 rounds" window
+                // length - 1 is the last item. length - 6 is the start of the last 3 rounds (User-AI, User-AI, User-AI)
+                const isRecent = index >= optimizedHistory.length - 6;
+                if (isRecent) return msg; // Keep recent messages intact (including images)
+                if (Array.isArray(msg.content)) {
+                    return {
+                        ...msg,
+                        content: msg.content.filter(c => c.type !== 'image')
+                    };
+                }
+                return msg;
+            });
+            const aiContent = await queryAI(optimizedHistory);
             if (!aiContent) {
                 console.error("Invalid AI response. Retrying...");
@@ -410,8 +444,13 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.error("Runtime Custom Error:", error);
         return { status: 'error', message: error.message };
     } finally {
-        console.log("Closing browser...");
-        await browser.close();
+        if (shouldCloseBrowser) {
+            console.log("Closing browser...");
+            await browser.close();
+        } else {
+            console.log("Closing context...");
+            await context.close();
+        }
     }
 }
@@ -434,7 +473,6 @@ function getFormattedDate() {
  * @param {string} taskId - The ID of the task to run
  */
 async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAgent) {
-    const results = [];
     const datetime = getFormattedDate();
     const folderName = `${taskId}_${datetime}`;
     const outputDir = path.join(process.cwd(), folderName);
@@ -451,37 +489,59 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     console.log(`Starting Task Loop for ${taskId}`);
-    for (let i = 1; i <= 5; i++) {
-        console.log(`\n=== Starting Iteration ${i}/5 ===`);
-        try {
-            const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner);
-            const { sessionId, agentMessages, ...rest } = data;
-            // Create session subdirectory
-            const sessionDir = path.join(outputDir, sessionId);
-            if (!fs.existsSync(sessionDir)) {
-                fs.mkdirSync(sessionDir, { recursive: true });
-            }
+    // Launch a shared browser instance
+    const browser = await chromium.launch({
+        headless: true,
+        args: ['--start-maximized']
+    });
-            // Save messages.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'messages.json'),
-                JSON.stringify(agentMessages, null, 2)
-            );
+    const results = [];
+    const MAX_CONCURRENCY = 5;
-            // Save result.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'result.json'),
-                JSON.stringify(rest, null, 2)
-            );
+    try {
+        const promises = [];
+        for (let i = 1; i <= MAX_CONCURRENCY; i++) {
+            promises.push((async () => {
+                console.log(`\n=== Starting Iteration ${i}/${MAX_CONCURRENCY} ===`);
+                try {
+                    // Pass shared browser to executeSingleCycle
+                    const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner, browser);
+                    const { sessionId, agentMessages, ...rest } = data;
+                    // Create session subdirectory
+                    const sessionDir = path.join(outputDir, sessionId);
+                    if (!fs.existsSync(sessionDir)) {
+                        fs.mkdirSync(sessionDir, { recursive: true });
+                    }
+                    // Save messages.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'messages.json'),
+                        JSON.stringify(agentMessages, null, 2)
+                    );
+                    // Save result.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'result.json'),
+                        JSON.stringify(rest, null, 2)
+                    );
+                    console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+                    return { sessionId, ...rest };
+                } catch (e) {
+                    console.error(`Iteration ${i} failed:`, e.stack || e.message);
+                    return { iteration: i, error: e.message };
+                }
+            })());
+        }
-            results.push({ sessionId, ...rest });
-            console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+        // Wait for all to finish
+        const resultsArray = await Promise.all(promises);
+        results.push(...resultsArray);
-        } catch (e) {
-            console.error(`Iteration ${i} failed:`, e.stack || e.message);
-            results.push({ iteration: i, error: e.message });
-        }
+    } finally {
+        console.log("Closing shared browser...");
+        await browser.close();
     }
     // Save final-results.json (Consolidated)
@@ -489,7 +549,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     results.filter(r => r.verifyResult);
     const scores = results.map(r => r.verifyResult?.score || 0);
     const successCount = scores.filter(s => s === 1).length;
-    const total = 5; // Fixed 5 iterations
+    const total = MAX_CONCURRENCY;
     const rate = `${successCount}/${total}`;
     const summary = {
@@ -527,7 +587,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     };
 }
-async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner) {
+async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner, browser) {
     const fetchJson = async (url, opts) => {
         const res = await fetch(url, opts);
         if (!res.ok) {
@@ -562,7 +622,8 @@ async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, ag
         taskInput: TaskJson.task.instruction,
         targetUrl: targetWeb,
         sessionId: sessionId,
-        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info
+        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info,
+        browser: browser // Pass the shared browser instance
     });
     // 4. Verify Task

package/dist/index.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
+import { chromium } from 'playwright';
 import fs from 'fs';
 import path from 'path';
-import { chromium } from 'playwright';
 import { createOpenAI } from '@ai-sdk/openai';
 import { generateText } from 'ai';
 import dotenv from 'dotenv';
@@ -286,7 +286,7 @@ async function executeAction(page, action) {
     return 'CONTINUE';
 }
-async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo }) {
+async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo, browser: externalBrowser }) {
     console.log(`[Agent] Starting task: ${taskInput} on ${targetUrl} (Session: ${sessionId})`);
     const screenshotsDir = path.join(process.cwd(), 'screenshots');
@@ -295,11 +295,19 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.log(`📁 创建截图目录: ${screenshotsDir}`);
     }
-    // 2. Launch Browser
-    const browser = await chromium.launch({
-        headless: true, // Visible for demo/debug
-        args: ['--start-maximized'] // Attempt to maximize
-    });
+    // 2. Launch Browser (or use existing)
+    let browser;
+    let shouldCloseBrowser = false;
+    if (externalBrowser) {
+        browser = externalBrowser;
+    } else {
+        browser = await chromium.launch({
+            headless: true, // Visible for demo/debug
+            args: ['--start-maximized'] // Attempt to maximize
+        });
+        shouldCloseBrowser = true;
+    }
     const context = await browser.newContext({
         viewport: { width: 430, height: 800 } // Set a reasonable fixed viewport
@@ -366,7 +374,33 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
             // 3. Query AI
             console.log("Querying AI...");
-            const aiContent = await queryAI(conversationHistory);
+            // Optimization: Window mode & Filter images
+            // 1. Keep last 20 rounds (40 messages) - Better memory than 3 rounds, but prevents infinite growth
+            let optimizedHistory = conversationHistory;
+            if (conversationHistory.length > 40) {
+                optimizedHistory = conversationHistory.slice(-40);
+            }
+            // 2. Filter images from older messages (Keep images only in the last 3 rounds / 6 messages)
+            // Strategy: "Fading Memory" - Recent = Full (Text+Img), Older = Text only
+            optimizedHistory = optimizedHistory.map((msg, index) => {
+                // Determine if this message is within the "recent 3 rounds" window
+                // length - 1 is the last item. length - 6 is the start of the last 3 rounds (User-AI, User-AI, User-AI)
+                const isRecent = index >= optimizedHistory.length - 6;
+                if (isRecent) return msg; // Keep recent messages intact (including images)
+                if (Array.isArray(msg.content)) {
+                    return {
+                        ...msg,
+                        content: msg.content.filter(c => c.type !== 'image')
+                    };
+                }
+                return msg;
+            });
+            const aiContent = await queryAI(optimizedHistory);
             if (!aiContent) {
                 console.error("Invalid AI response. Retrying...");
@@ -410,8 +444,13 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.error("Runtime Custom Error:", error);
         return { status: 'error', message: error.message };
     } finally {
-        console.log("Closing browser...");
-        await browser.close();
+        if (shouldCloseBrowser) {
+            console.log("Closing browser...");
+            await browser.close();
+        } else {
+            console.log("Closing context...");
+            await context.close();
+        }
     }
 }
@@ -434,7 +473,6 @@ function getFormattedDate() {
  * @param {string} taskId - The ID of the task to run
  */
 async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAgent) {
-    const results = [];
     const datetime = getFormattedDate();
     const folderName = `${taskId}_${datetime}`;
     const outputDir = path.join(process.cwd(), folderName);
@@ -451,37 +489,59 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     console.log(`Starting Task Loop for ${taskId}`);
-    for (let i = 1; i <= 5; i++) {
-        console.log(`\n=== Starting Iteration ${i}/5 ===`);
-        try {
-            const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner);
-            const { sessionId, agentMessages, ...rest } = data;
-            // Create session subdirectory
-            const sessionDir = path.join(outputDir, sessionId);
-            if (!fs.existsSync(sessionDir)) {
-                fs.mkdirSync(sessionDir, { recursive: true });
-            }
+    // Launch a shared browser instance
+    const browser = await chromium.launch({
+        headless: true,
+        args: ['--start-maximized']
+    });
-            // Save messages.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'messages.json'),
-                JSON.stringify(agentMessages, null, 2)
-            );
+    const results = [];
+    const MAX_CONCURRENCY = 5;
-            // Save result.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'result.json'),
-                JSON.stringify(rest, null, 2)
-            );
+    try {
+        const promises = [];
+        for (let i = 1; i <= MAX_CONCURRENCY; i++) {
+            promises.push((async () => {
+                console.log(`\n=== Starting Iteration ${i}/${MAX_CONCURRENCY} ===`);
+                try {
+                    // Pass shared browser to executeSingleCycle
+                    const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner, browser);
+                    const { sessionId, agentMessages, ...rest } = data;
+                    // Create session subdirectory
+                    const sessionDir = path.join(outputDir, sessionId);
+                    if (!fs.existsSync(sessionDir)) {
+                        fs.mkdirSync(sessionDir, { recursive: true });
+                    }
+                    // Save messages.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'messages.json'),
+                        JSON.stringify(agentMessages, null, 2)
+                    );
+                    // Save result.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'result.json'),
+                        JSON.stringify(rest, null, 2)
+                    );
+                    console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+                    return { sessionId, ...rest };
+                } catch (e) {
+                    console.error(`Iteration ${i} failed:`, e.stack || e.message);
+                    return { iteration: i, error: e.message };
+                }
+            })());
+        }
-            results.push({ sessionId, ...rest });
-            console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+        // Wait for all to finish
+        const resultsArray = await Promise.all(promises);
+        results.push(...resultsArray);
-        } catch (e) {
-            console.error(`Iteration ${i} failed:`, e.stack || e.message);
-            results.push({ iteration: i, error: e.message });
-        }
+    } finally {
+        console.log("Closing shared browser...");
+        await browser.close();
     }
     // Save final-results.json (Consolidated)
@@ -489,7 +549,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     results.filter(r => r.verifyResult);
     const scores = results.map(r => r.verifyResult?.score || 0);
     const successCount = scores.filter(s => s === 1).length;
-    const total = 5; // Fixed 5 iterations
+    const total = MAX_CONCURRENCY;
     const rate = `${successCount}/${total}`;
     const summary = {
@@ -527,7 +587,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     };
 }
-async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner) {
+async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner, browser) {
     const fetchJson = async (url, opts) => {
         const res = await fetch(url, opts);
         if (!res.ok) {
@@ -562,7 +622,8 @@ async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, ag
         taskInput: TaskJson.task.instruction,
         targetUrl: targetWeb,
         sessionId: sessionId,
-        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info
+        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info,
+        browser: browser // Pass the shared browser instance
     });
     // 4. Verify Task

package/dist/index.js CHANGED Viewed

@@ -33,6 +33,7 @@ __export(index_exports, {
   runTaskLoop: () => runTaskLoop
 });
 module.exports = __toCommonJS(index_exports);
+var import_playwright2 = require("playwright");
 var import_fs2 = __toESM(require("fs"));
 var import_path3 = __toESM(require("path"));
@@ -294,19 +295,26 @@ async function executeAction(page, action) {
 }
 // src/runner.js
-async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo }) {
+async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo, browser: externalBrowser }) {
   console.log(`[Agent] Starting task: ${taskInput} on ${targetUrl} (Session: ${sessionId})`);
   const screenshotsDir = import_path2.default.join(process.cwd(), "screenshots");
   if (!import_fs.default.existsSync(screenshotsDir)) {
     import_fs.default.mkdirSync(screenshotsDir, { recursive: true });
     console.log(`\u{1F4C1} \u521B\u5EFA\u622A\u56FE\u76EE\u5F55: ${screenshotsDir}`);
   }
-  const browser = await import_playwright.chromium.launch({
-    headless: true,
-    // Visible for demo/debug
-    args: ["--start-maximized"]
-    // Attempt to maximize
-  });
+  let browser;
+  let shouldCloseBrowser = false;
+  if (externalBrowser) {
+    browser = externalBrowser;
+  } else {
+    browser = await import_playwright.chromium.launch({
+      headless: true,
+      // Visible for demo/debug
+      args: ["--start-maximized"]
+      // Attempt to maximize
+    });
+    shouldCloseBrowser = true;
+  }
   const context = await browser.newContext({
     viewport: { width: 430, height: 800 }
     // Set a reasonable fixed viewport
@@ -358,7 +366,22 @@ Please perform the next action based on the screenshot.`;
         content: userContent
       });
       console.log("Querying AI...");
-      const aiContent = await queryAI(conversationHistory);
+      let optimizedHistory = conversationHistory;
+      if (conversationHistory.length > 40) {
+        optimizedHistory = conversationHistory.slice(-40);
+      }
+      optimizedHistory = optimizedHistory.map((msg, index) => {
+        const isRecent = index >= optimizedHistory.length - 6;
+        if (isRecent) return msg;
+        if (Array.isArray(msg.content)) {
+          return {
+            ...msg,
+            content: msg.content.filter((c) => c.type !== "image")
+          };
+        }
+        return msg;
+      });
+      const aiContent = await queryAI(optimizedHistory);
       if (!aiContent) {
         console.error("Invalid AI response. Retrying...");
         await page.waitForTimeout(2e3);
@@ -391,8 +414,13 @@ Please perform the next action based on the screenshot.`;
     console.error("Runtime Custom Error:", error);
     return { status: "error", message: error.message };
   } finally {
-    console.log("Closing browser...");
-    await browser.close();
+    if (shouldCloseBrowser) {
+      console.log("Closing browser...");
+      await browser.close();
+    } else {
+      console.log("Closing context...");
+      await context.close();
+    }
   }
 }
@@ -406,7 +434,6 @@ function getFormattedDate() {
   return `${now.getFullYear()}${pad(now.getMonth() + 1)}${pad(now.getDate())}_${pad(now.getHours())}${pad(now.getMinutes())}${pad(now.getSeconds())}`;
 }
 async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAgent) {
-  const results = [];
   const datetime = getFormattedDate();
   const folderName = `${taskId}_${datetime}`;
   const outputDir = import_path3.default.join(process.cwd(), folderName);
@@ -417,30 +444,46 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
   if (!targetWeb.startsWith("http")) targetWeb = "http://" + targetWeb;
   if (!targetServer.startsWith("http")) targetServer = "http://" + targetServer;
   console.log(`Starting Task Loop for ${taskId}`);
-  for (let i = 1; i <= 5; i++) {
-    console.log(`
-=== Starting Iteration ${i}/5 ===`);
-    try {
-      const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner);
-      const { sessionId, agentMessages, ...rest } = data;
-      const sessionDir = import_path3.default.join(outputDir, sessionId);
-      if (!import_fs2.default.existsSync(sessionDir)) {
-        import_fs2.default.mkdirSync(sessionDir, { recursive: true });
-      }
-      import_fs2.default.writeFileSync(
-        import_path3.default.join(sessionDir, "messages.json"),
-        JSON.stringify(agentMessages, null, 2)
-      );
-      import_fs2.default.writeFileSync(
-        import_path3.default.join(sessionDir, "result.json"),
-        JSON.stringify(rest, null, 2)
-      );
-      results.push({ sessionId, ...rest });
-      console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
-    } catch (e) {
-      console.error(`Iteration ${i} failed:`, e.stack || e.message);
-      results.push({ iteration: i, error: e.message });
+  const browser = await import_playwright2.chromium.launch({
+    headless: true,
+    args: ["--start-maximized"]
+  });
+  const results = [];
+  const MAX_CONCURRENCY = 5;
+  try {
+    const promises = [];
+    for (let i = 1; i <= MAX_CONCURRENCY; i++) {
+      promises.push((async () => {
+        console.log(`
+=== Starting Iteration ${i}/${MAX_CONCURRENCY} ===`);
+        try {
+          const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner, browser);
+          const { sessionId, agentMessages, ...rest } = data;
+          const sessionDir = import_path3.default.join(outputDir, sessionId);
+          if (!import_fs2.default.existsSync(sessionDir)) {
+            import_fs2.default.mkdirSync(sessionDir, { recursive: true });
+          }
+          import_fs2.default.writeFileSync(
+            import_path3.default.join(sessionDir, "messages.json"),
+            JSON.stringify(agentMessages, null, 2)
+          );
+          import_fs2.default.writeFileSync(
+            import_path3.default.join(sessionDir, "result.json"),
+            JSON.stringify(rest, null, 2)
+          );
+          console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+          return { sessionId, ...rest };
+        } catch (e) {
+          console.error(`Iteration ${i} failed:`, e.stack || e.message);
+          return { iteration: i, error: e.message };
+        }
+      })());
     }
+    const resultsArray = await Promise.all(promises);
+    results.push(...resultsArray);
+  } finally {
+    console.log("Closing shared browser...");
+    await browser.close();
   }
   const validResults = results.filter((r) => r.verifyResult);
   const scores = results.map((r) => {
@@ -448,7 +491,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     return ((_a = r.verifyResult) == null ? void 0 : _a.score) || 0;
   });
   const successCount = scores.filter((s) => s === 1).length;
-  const total = 5;
+  const total = MAX_CONCURRENCY;
   const rate = `${successCount}/${total}`;
   const summary = {
     rate,
@@ -479,7 +522,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     taskId
   };
 }
-async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner) {
+async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner, browser) {
   const fetchJson = async (url, opts) => {
     const res = await fetch(url, opts);
     if (!res.ok) {
@@ -507,7 +550,9 @@ async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, ag
     taskInput: TaskJson.task.instruction,
     targetUrl: targetWeb,
     sessionId,
-    simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info
+    simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info,
+    browser
+    // Pass the shared browser instance
   });
   console.log("Verifying result...");
   const verifyUrl = `${targetServer}/api/verify/run`;

package/dist/index.mjs CHANGED Viewed

@@ -1,4 +1,5 @@
 // src/index.js
+import { chromium as chromium2 } from "playwright";
 import fs2 from "fs";
 import path3 from "path";
@@ -260,19 +261,26 @@ async function executeAction(page, action) {
 }
 // src/runner.js
-async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo }) {
+async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo, browser: externalBrowser }) {
   console.log(`[Agent] Starting task: ${taskInput} on ${targetUrl} (Session: ${sessionId})`);
   const screenshotsDir = path2.join(process.cwd(), "screenshots");
   if (!fs.existsSync(screenshotsDir)) {
     fs.mkdirSync(screenshotsDir, { recursive: true });
     console.log(`\u{1F4C1} \u521B\u5EFA\u622A\u56FE\u76EE\u5F55: ${screenshotsDir}`);
   }
-  const browser = await chromium.launch({
-    headless: true,
-    // Visible for demo/debug
-    args: ["--start-maximized"]
-    // Attempt to maximize
-  });
+  let browser;
+  let shouldCloseBrowser = false;
+  if (externalBrowser) {
+    browser = externalBrowser;
+  } else {
+    browser = await chromium.launch({
+      headless: true,
+      // Visible for demo/debug
+      args: ["--start-maximized"]
+      // Attempt to maximize
+    });
+    shouldCloseBrowser = true;
+  }
   const context = await browser.newContext({
     viewport: { width: 430, height: 800 }
     // Set a reasonable fixed viewport
@@ -324,7 +332,22 @@ Please perform the next action based on the screenshot.`;
         content: userContent
       });
       console.log("Querying AI...");
-      const aiContent = await queryAI(conversationHistory);
+      let optimizedHistory = conversationHistory;
+      if (conversationHistory.length > 40) {
+        optimizedHistory = conversationHistory.slice(-40);
+      }
+      optimizedHistory = optimizedHistory.map((msg, index) => {
+        const isRecent = index >= optimizedHistory.length - 6;
+        if (isRecent) return msg;
+        if (Array.isArray(msg.content)) {
+          return {
+            ...msg,
+            content: msg.content.filter((c) => c.type !== "image")
+          };
+        }
+        return msg;
+      });
+      const aiContent = await queryAI(optimizedHistory);
       if (!aiContent) {
         console.error("Invalid AI response. Retrying...");
         await page.waitForTimeout(2e3);
@@ -357,8 +380,13 @@ Please perform the next action based on the screenshot.`;
     console.error("Runtime Custom Error:", error);
     return { status: "error", message: error.message };
   } finally {
-    console.log("Closing browser...");
-    await browser.close();
+    if (shouldCloseBrowser) {
+      console.log("Closing browser...");
+      await browser.close();
+    } else {
+      console.log("Closing context...");
+      await context.close();
+    }
   }
 }
@@ -372,7 +400,6 @@ function getFormattedDate() {
   return `${now.getFullYear()}${pad(now.getMonth() + 1)}${pad(now.getDate())}_${pad(now.getHours())}${pad(now.getMinutes())}${pad(now.getSeconds())}`;
 }
 async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAgent) {
-  const results = [];
   const datetime = getFormattedDate();
   const folderName = `${taskId}_${datetime}`;
   const outputDir = path3.join(process.cwd(), folderName);
@@ -383,30 +410,46 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
   if (!targetWeb.startsWith("http")) targetWeb = "http://" + targetWeb;
   if (!targetServer.startsWith("http")) targetServer = "http://" + targetServer;
   console.log(`Starting Task Loop for ${taskId}`);
-  for (let i = 1; i <= 5; i++) {
-    console.log(`
-=== Starting Iteration ${i}/5 ===`);
-    try {
-      const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner);
-      const { sessionId, agentMessages, ...rest } = data;
-      const sessionDir = path3.join(outputDir, sessionId);
-      if (!fs2.existsSync(sessionDir)) {
-        fs2.mkdirSync(sessionDir, { recursive: true });
-      }
-      fs2.writeFileSync(
-        path3.join(sessionDir, "messages.json"),
-        JSON.stringify(agentMessages, null, 2)
-      );
-      fs2.writeFileSync(
-        path3.join(sessionDir, "result.json"),
-        JSON.stringify(rest, null, 2)
-      );
-      results.push({ sessionId, ...rest });
-      console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
-    } catch (e) {
-      console.error(`Iteration ${i} failed:`, e.stack || e.message);
-      results.push({ iteration: i, error: e.message });
+  const browser = await chromium2.launch({
+    headless: true,
+    args: ["--start-maximized"]
+  });
+  const results = [];
+  const MAX_CONCURRENCY = 5;
+  try {
+    const promises = [];
+    for (let i = 1; i <= MAX_CONCURRENCY; i++) {
+      promises.push((async () => {
+        console.log(`
+=== Starting Iteration ${i}/${MAX_CONCURRENCY} ===`);
+        try {
+          const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner, browser);
+          const { sessionId, agentMessages, ...rest } = data;
+          const sessionDir = path3.join(outputDir, sessionId);
+          if (!fs2.existsSync(sessionDir)) {
+            fs2.mkdirSync(sessionDir, { recursive: true });
+          }
+          fs2.writeFileSync(
+            path3.join(sessionDir, "messages.json"),
+            JSON.stringify(agentMessages, null, 2)
+          );
+          fs2.writeFileSync(
+            path3.join(sessionDir, "result.json"),
+            JSON.stringify(rest, null, 2)
+          );
+          console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+          return { sessionId, ...rest };
+        } catch (e) {
+          console.error(`Iteration ${i} failed:`, e.stack || e.message);
+          return { iteration: i, error: e.message };
+        }
+      })());
     }
+    const resultsArray = await Promise.all(promises);
+    results.push(...resultsArray);
+  } finally {
+    console.log("Closing shared browser...");
+    await browser.close();
   }
   const validResults = results.filter((r) => r.verifyResult);
   const scores = results.map((r) => {
@@ -414,7 +457,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     return ((_a = r.verifyResult) == null ? void 0 : _a.score) || 0;
   });
   const successCount = scores.filter((s) => s === 1).length;
-  const total = 5;
+  const total = MAX_CONCURRENCY;
   const rate = `${successCount}/${total}`;
   const summary = {
     rate,
@@ -445,7 +488,7 @@ async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAge
     taskId
   };
 }
-async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner) {
+async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner, browser) {
   const fetchJson = async (url, opts) => {
     const res = await fetch(url, opts);
     if (!res.ok) {
@@ -473,7 +516,9 @@ async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, ag
     taskInput: TaskJson.task.instruction,
     targetUrl: targetWeb,
     sessionId,
-    simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info
+    simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info,
+    browser
+    // Pass the shared browser instance
   });
   console.log("Verifying result...");
   const verifyUrl = `${targetServer}/api/verify/run`;

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rl-simulator-core",
-  "version": "1.0.8",
+  "version": "1.2.0",
   "main": "./dist/index.js",
   "module": "./dist/index.mjs",
   "types": "./dist/index.d.ts",

package/src/index.js CHANGED Viewed

@@ -1,4 +1,4 @@
+import { chromium } from 'playwright';
 import fs from 'fs';
 import path from 'path';
 import { runAgent } from './runner.js';
@@ -26,7 +26,6 @@ function getFormattedDate() {
  * @param {string} taskId - The ID of the task to run
  */
 export async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner = runAgent) {
-    const results = [];
     const datetime = getFormattedDate();
     const folderName = `${taskId}_${datetime}`;
     const outputDir = path.join(process.cwd(), folderName);
@@ -43,37 +42,59 @@ export async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner =
     console.log(`Starting Task Loop for ${taskId}`);
-    for (let i = 1; i <= 5; i++) {
-        console.log(`\n=== Starting Iteration ${i}/5 ===`);
-        try {
-            const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner);
-            const { sessionId, agentMessages, ...rest } = data;
-            // Create session subdirectory
-            const sessionDir = path.join(outputDir, sessionId);
-            if (!fs.existsSync(sessionDir)) {
-                fs.mkdirSync(sessionDir, { recursive: true });
-            }
-            // Save messages.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'messages.json'),
-                JSON.stringify(agentMessages, null, 2)
-            );
-            // Save result.json
-            fs.writeFileSync(
-                path.join(sessionDir, 'result.json'),
-                JSON.stringify(rest, null, 2)
-            );
-            results.push({ sessionId, ...rest });
-            console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
-        } catch (e) {
-            console.error(`Iteration ${i} failed:`, e.stack || e.message);
-            results.push({ iteration: i, error: e.message });
+    // Launch a shared browser instance
+    const browser = await chromium.launch({
+        headless: true,
+        args: ['--start-maximized']
+    });
+    const results = [];
+    const MAX_CONCURRENCY = 5;
+    try {
+        const promises = [];
+        for (let i = 1; i <= MAX_CONCURRENCY; i++) {
+            promises.push((async () => {
+                console.log(`\n=== Starting Iteration ${i}/${MAX_CONCURRENCY} ===`);
+                try {
+                    // Pass shared browser to executeSingleCycle
+                    const data = await executeSingleCycle(targetWeb, targetServer, taskId, i, agentRunner, browser);
+                    const { sessionId, agentMessages, ...rest } = data;
+                    // Create session subdirectory
+                    const sessionDir = path.join(outputDir, sessionId);
+                    if (!fs.existsSync(sessionDir)) {
+                        fs.mkdirSync(sessionDir, { recursive: true });
+                    }
+                    // Save messages.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'messages.json'),
+                        JSON.stringify(agentMessages, null, 2)
+                    );
+                    // Save result.json
+                    fs.writeFileSync(
+                        path.join(sessionDir, 'result.json'),
+                        JSON.stringify(rest, null, 2)
+                    );
+                    console.log(`Iteration ${i} completed. Saved to ${sessionDir}`);
+                    return { sessionId, ...rest };
+                } catch (e) {
+                    console.error(`Iteration ${i} failed:`, e.stack || e.message);
+                    return { iteration: i, error: e.message };
+                }
+            })());
         }
+        // Wait for all to finish
+        const resultsArray = await Promise.all(promises);
+        results.push(...resultsArray);
+    } finally {
+        console.log("Closing shared browser...");
+        await browser.close();
     }
     // Save final-results.json (Consolidated)
@@ -81,7 +102,7 @@ export async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner =
     const validResults = results.filter(r => r.verifyResult);
     const scores = results.map(r => r.verifyResult?.score || 0);
     const successCount = scores.filter(s => s === 1).length;
-    const total = 5; // Fixed 5 iterations
+    const total = MAX_CONCURRENCY;
     const rate = `${successCount}/${total}`;
     const summary = {
@@ -119,7 +140,7 @@ export async function runTaskLoop(targetWeb, targetServer, taskId, agentRunner =
     };
 }
-async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner) {
+async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, agentRunner, browser) {
     const fetchJson = async (url, opts) => {
         const res = await fetch(url, opts);
         if (!res.ok) {
@@ -154,7 +175,8 @@ async function executeSingleCycle(targetWeb, targetServer, taskId, iteration, ag
         taskInput: TaskJson.task.instruction,
         targetUrl: targetWeb,
         sessionId: sessionId,
-        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info
+        simulatedUserKnownInfo: TaskJson.task.simulated_user_known_info,
+        browser: browser // Pass the shared browser instance
     });
     // 4. Verify Task

package/src/runner.js CHANGED Viewed

@@ -4,7 +4,7 @@ import path from 'path';
 import { queryAI, parseActions } from './ai.js';
 import { executeAction } from './actions.js';
-async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo }) {
+async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInfo, browser: externalBrowser }) {
     console.log(`[Agent] Starting task: ${taskInput} on ${targetUrl} (Session: ${sessionId})`);
     const screenshotsDir = path.join(process.cwd(), 'screenshots');
@@ -13,11 +13,19 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.log(`📁 创建截图目录: ${screenshotsDir}`);
     }
-    // 2. Launch Browser
-    const browser = await chromium.launch({
-        headless: true, // Visible for demo/debug
-        args: ['--start-maximized'] // Attempt to maximize
-    });
+    // 2. Launch Browser (or use existing)
+    let browser;
+    let shouldCloseBrowser = false;
+    if (externalBrowser) {
+        browser = externalBrowser;
+    } else {
+        browser = await chromium.launch({
+            headless: true, // Headless: no visible window (set to false for demo/debug)
+            args: ['--start-maximized'] // Attempt to maximize
+        });
+        shouldCloseBrowser = true;
+    }
     const context = await browser.newContext({
         viewport: { width: 430, height: 800 } // Set a reasonable fixed viewport
@@ -84,7 +92,33 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
             // 3. Query AI
             console.log("Querying AI...");
-            const aiContent = await queryAI(conversationHistory);
+            // Optimization: Window mode & Filter images
+            // 1. Keep last 20 rounds (40 messages) - Better memory than 3 rounds, but prevents infinite growth
+            let optimizedHistory = conversationHistory;
+            if (conversationHistory.length > 40) {
+                optimizedHistory = conversationHistory.slice(-40);
+            }
+            // 2. Filter images from older messages (Keep images only in the last 3 rounds / 6 messages)
+            // Strategy: "Fading Memory" - Recent = Full (Text+Img), Older = Text only
+            optimizedHistory = optimizedHistory.map((msg, index) => {
+                // Determine if this message is within the "recent 3 rounds" window
+                // length - 1 is the last item. length - 6 is the start of the last 3 rounds (User-AI, User-AI, User-AI)
+                const isRecent = index >= optimizedHistory.length - 6;
+                if (isRecent) return msg; // Keep recent messages intact (including images)
+                if (Array.isArray(msg.content)) {
+                    return {
+                        ...msg,
+                        content: msg.content.filter(c => c.type !== 'image')
+                    };
+                }
+                return msg;
+            });
+            const aiContent = await queryAI(optimizedHistory);
             if (!aiContent) {
                 console.error("Invalid AI response. Retrying...");
@@ -128,8 +162,13 @@ async function runAgent({ targetUrl, taskInput, sessionId, simulatedUserKnownInf
         console.error("Runtime Custom Error:", error);
         return { status: 'error', message: error.message };
     } finally {
-        console.log("Closing browser...");
-        await browser.close();
+        if (shouldCloseBrowser) {
+            console.log("Closing browser...");
+            await browser.close();
+        } else {
+            console.log("Closing context...");
+            await context.close();
+        }
     }
 }