npm - @empiricalrun/test-gen - Versions diffs - 0.31.10 → 0.31.13 - Mend

@empiricalrun/test-gen 0.31.10 → 0.31.13

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/CHANGELOG.md +21 -0
package/dist/actions/next-task.d.ts.map +1 -1
package/dist/actions/next-task.js +2 -1
package/dist/actions/utils/index.d.ts.map +1 -1
package/dist/actions/utils/index.js +2 -1
package/dist/agent/browsing/o1-completion.d.ts.map +1 -1
package/dist/agent/browsing/o1-completion.js +1 -0
package/dist/agent/master/run.d.ts +9 -0
package/dist/agent/master/run.d.ts.map +1 -1
package/dist/agent/master/run.js +24 -12
package/dist/bin/index.js +6 -4
package/package.json +3 -3

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,26 @@
 # @empiricalrun/test-gen
+## 0.31.13
+### Patch Changes
+- 759bfc0: fix: accuracy of element selector
+## 0.31.12
+### Patch Changes
+- a8f2ea6: chore: add test for master agent
+- Updated dependencies [10f554d]
+  - @empiricalrun/reporter@0.20.2
+## 0.31.11
+### Patch Changes
+- Updated dependencies [9623b74]
+  - @empiricalrun/reporter@0.20.1
 ## 0.31.10
 ### Patch Changes

package/dist/actions/next-task.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"next-task.d.ts","sourceRoot":"","sources":["../../src/actions/next-task.ts"],"names":[],"mappings":"AAAA,eAAO,MAAM,SAAS,cAAc,CAAC;AAErC,eAAO,MAAM,cAAc;;;;;;;;;;;;;;;;;;;;;;;~~CA0B1B~~,CAAC"}
1	+ {"version":3,"file":"next-task.d.ts","sourceRoot":"","sources":["../../src/actions/next-task.ts"],"names":[],"mappings":"AAAA,eAAO,MAAM,SAAS,cAAc,CAAC;AAErC,eAAO,MAAM,cAAc;;;;;;;;;;;;;;;;;;;;;;;CA2B1B,CAAC"}

package/dist/actions/next-task.js CHANGED Viewed

@@ -15,7 +15,8 @@ exports.NextTaskAction = {
                     action: {
                         type: "string",
                         description: `explain the next action in natural language.
-The next action should be as atomic as possible. E.g. each click, key press, input should be a separate action.
+The next action should be as atomic as possible, precise and should contain enough details about the action to be performed.
+E.g. each click, key press, input, assert should be a separate action.
 Each action should take the task to completion, if not the action is invalid.`,
                     },
                     reason: {

package/dist/actions/utils/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/actions/utils/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;AAElC,OAAO,CAAC,MAAM,CAAC;IACb,UAAU,MAAM;QACd,UAAU,EAAE,GAAG,CAAC;QAChB,MAAM,EAAE,GAAG,CAAC;KACb;CACF;AAED,wBAAsB,oCAAoC,CACxD,WAAW,EAAE,MAAM,EACnB,KAAK,EAAE,MAAM,EACb,IAAI,EAAE,IAAI,~~gBA6CX~~;AAED,wBAAgB,cAAc,WAG7B"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/actions/utils/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;AAElC,OAAO,CAAC,MAAM,CAAC;IACb,UAAU,MAAM;QACd,UAAU,EAAE,GAAG,CAAC;QAChB,MAAM,EAAE,GAAG,CAAC;KACb;CACF;AAED,wBAAsB,oCAAoC,CACxD,WAAW,EAAE,MAAM,EACnB,KAAK,EAAE,MAAM,EACb,IAAI,EAAE,IAAI,gBA8CX;AAED,wBAAgB,cAAc,WAG7B"}

package/dist/actions/utils/index.js CHANGED Viewed

@@ -14,7 +14,8 @@ async function getPlaywrightLocatorUsingCssSelector(cssSelector, xpath, page) {
         }
         let selectedElem;
         try {
-            selectedElem = getElementByXpath(locator.xpath);
+            const xpath = locator.xpath?.replaceAll("text()", "normalize-space()");
+            selectedElem = getElementByXpath(xpath);
         }
         catch (e) {
             // ignore error

package/dist/agent/browsing/o1-completion.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"o1-completion.d.ts","sourceRoot":"","sources":["../../../src/agent/browsing/o1-completion.ts"],"names":[],"mappings":"AAAA,OAAO,EAAO,WAAW,EAAE,MAAM,mBAAmB,CAAC;AACrD,OAAO,EACL,qBAAqB,EACrB,0BAA0B,EAC1B,kBAAkB,EACnB,MAAM,4BAA4B,CAAC;AAKpC,wBAAsB,eAAe,CAAC,EACpC,QAAQ,EACR,KAAK,EACL,KAAK,GACN,EAAE;IACD,QAAQ,EAAE,0BAA0B,EAAE,CAAC;IACvC,KAAK,EAAE,kBAAkB,EAAE,CAAC;IAC5B,KAAK,CAAC,EAAE,WAAW,CAAC;CACrB,GAAG,OAAO,CAAC,qBAAqB,GAAG,SAAS,CAAC,~~CAyD7C~~"}
1	+ {"version":3,"file":"o1-completion.d.ts","sourceRoot":"","sources":["../../../src/agent/browsing/o1-completion.ts"],"names":[],"mappings":"AAAA,OAAO,EAAO,WAAW,EAAE,MAAM,mBAAmB,CAAC;AACrD,OAAO,EACL,qBAAqB,EACrB,0BAA0B,EAC1B,kBAAkB,EACnB,MAAM,4BAA4B,CAAC;AAKpC,wBAAsB,eAAe,CAAC,EACpC,QAAQ,EACR,KAAK,EACL,KAAK,GACN,EAAE;IACD,QAAQ,EAAE,0BAA0B,EAAE,CAAC;IACvC,KAAK,EAAE,kBAAkB,EAAE,CAAC;IAC5B,KAAK,CAAC,EAAE,WAAW,CAAC;CACrB,GAAG,OAAO,CAAC,qBAAqB,GAAG,SAAS,CAAC,CA0D7C"}

package/dist/agent/browsing/o1-completion.js CHANGED Viewed

@@ -31,6 +31,7 @@ async function getO1Completion({ messages, tools, trace, }) {
     Before responding, ensure the following:
     - Do not respond with markdown, respond only with the JSON object.
     - Do not respond with any backticks.
+    - The reason for action should also include what was been executed in the action.
   `;
         const response = (await llm.createChatCompletion({
             messages: [userInstruction],

package/dist/agent/master/run.d.ts CHANGED Viewed

@@ -2,6 +2,15 @@ import { LLM, TraceClient } from "@empiricalrun/llm";
 import { Page } from "playwright";
 import { TestGenConfigOptions } from "../../types";
 type BrowsingAgentOptions = Partial<TestGenConfigOptions>;
+export declare function getNextAction({ task, executedActions, page, trace, llm, options, pageScreenshot, }: {
+    task: string;
+    executedActions: string[];
+    page: Page;
+    trace?: TraceClient;
+    llm: LLM;
+    options: BrowsingAgentOptions;
+    pageScreenshot: string;
+}): Promise<import("openai/resources/index.mjs").ChatCompletionMessageToolCall | undefined>;
 export declare function masterAgent(task: string, page: Page, executedActions: string[], trace: TraceClient, llm: LLM, options: BrowsingAgentOptions): Promise<any>;
 export {};
 //# sourceMappingURL=run.d.ts.map

package/dist/agent/master/run.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"run.d.ts","sourceRoot":"","sources":["../../../src/agent/master/run.ts"],"names":[],"mappings":"AAAA,OAAO,EAAa,GAAG,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AAGhE,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;~~AASlC~~,OAAO,EAAE,oBAAoB,EAAE,MAAM,aAAa,CAAC;AAEnD,KAAK,oBAAoB,GAAG,OAAO,CAAC,oBAAoB,CAAC,CAAC;AAE1D,wBAAsB,WAAW,CAC/B,IAAI,EAAE,MAAM,EACZ,IAAI,EAAE,IAAI,EACV,eAAe,EAAE,MAAM,EAAE,EACzB,KAAK,EAAE,WAAW,EAClB,GAAG,EAAE,GAAG,EACR,OAAO,EAAE,oBAAoB,~~gBA0E9B~~"}
1	+ {"version":3,"file":"run.d.ts","sourceRoot":"","sources":["../../../src/agent/master/run.ts"],"names":[],"mappings":"AAAA,OAAO,EAAa,GAAG,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AAGhE,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;AAQlC,OAAO,EAAE,oBAAoB,EAAE,MAAM,aAAa,CAAC;AAEnD,KAAK,oBAAoB,GAAG,OAAO,CAAC,oBAAoB,CAAC,CAAC;AAE1D,wBAAsB,aAAa,CAAC,EAClC,IAAI,EACJ,eAAe,EACf,IAAI,EACJ,KAAK,EACL,GAAG,EACH,OAAO,EACP,cAAc,GACf,EAAE;IACD,IAAI,EAAE,MAAM,CAAC;IACb,eAAe,EAAE,MAAM,EAAE,CAAC;IAC1B,IAAI,EAAE,IAAI,CAAC;IACX,KAAK,CAAC,EAAE,WAAW,CAAC;IACpB,GAAG,EAAE,GAAG,CAAC;IACT,OAAO,EAAE,oBAAoB,CAAC;IAC9B,cAAc,EAAE,MAAM,CAAC;CACxB,2FA+CA;AAED,wBAAsB,WAAW,CAC/B,IAAI,EAAE,MAAM,EACZ,IAAI,EAAE,IAAI,EACV,eAAe,EAAE,MAAM,EAAE,EACzB,KAAK,EAAE,WAAW,EAClB,GAAG,EAAE,GAAG,EACR,OAAO,EAAE,oBAAoB,gBAsC9B"}

package/dist/agent/master/run.js CHANGED Viewed

@@ -1,19 +1,13 @@
 "use strict";
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.masterAgent = void 0;
+exports.masterAgent = exports.getNextAction = void 0;
 const llm_1 = require("@empiricalrun/llm");
 const vision_1 = require("@empiricalrun/llm/vision");
-const done_1 = require("../../actions/done");
 const next_task_1 = require("../../actions/next-task");
 const constants_1 = require("../../constants");
 const reporter_1 = require("../../reporter");
-async function masterAgent(task, page, executedActions, trace, llm, options) {
-    trace.update({ input: { task } });
-    const promptSpan = trace.span({ name: "page-prompt" });
-    const buffer = await page.screenshot({ fullPage: true });
-    const testGenReporter = new reporter_1.TestGenUpdatesReporter();
-    const testGenSnapshotUpdatePromise = testGenReporter.sendCurrentView(buffer);
-    const pageScreenshot = buffer.toString("base64");
+async function getNextAction({ task, executedActions, page, trace, llm, options, pageScreenshot, }) {
+    const promptSpan = trace?.span({ name: "page-prompt" });
     const promptMessages = await (0, llm_1.getPrompt)("test-gen", {
         task,
         executedActions: executedActions.map((a) => a).join("\n"),
@@ -38,8 +32,8 @@ async function masterAgent(task, page, executedActions, trace, llm, options) {
         systemMessage,
         userMessage,
     ];
-    const tools = [next_task_1.NextTaskAction.schema, (0, done_1.doneActionGenerator)(page).schema];
-    promptSpan.end({ output: { messages } });
+    const tools = [next_task_1.NextTaskAction.schema];
+    promptSpan?.end({ output: { messages } });
     const completion = await llm.createChatCompletion({
         messages,
         modelParameters: {
@@ -52,8 +46,26 @@ async function masterAgent(task, page, executedActions, trace, llm, options) {
         // @ts-ignore
         tools,
     });
-    let output;
     const toolCall = completion?.tool_calls?.[0];
+    return toolCall;
+}
+exports.getNextAction = getNextAction;
+async function masterAgent(task, page, executedActions, trace, llm, options) {
+    trace.update({ input: { task } });
+    const buffer = await page.screenshot({ fullPage: true });
+    const testGenReporter = new reporter_1.TestGenUpdatesReporter();
+    const testGenSnapshotUpdatePromise = testGenReporter.sendCurrentView(buffer);
+    const pageScreenshot = buffer.toString("base64");
+    let output;
+    const toolCall = await getNextAction({
+        task,
+        executedActions,
+        page,
+        trace,
+        llm,
+        options,
+        pageScreenshot,
+    });
     if (toolCall) {
         if (toolCall.function.name === "task_done") {
             output = {

package/dist/bin/index.js CHANGED Viewed

@@ -69,10 +69,12 @@ async function runAgent(testGenConfig) {
         testGenFailed = true;
         new logger_1.CustomLogger().error(`Failed to generate test for the scenario. ${process.env.LOG_URL ? `[view log](${process.env.LOG_URL})` : ""}`);
     }
-    await new reporter_1.TestGenUpdatesReporter().reportGenAssets({
-        projectRepoName: testGenConfig.options.metadata.projectRepoName,
-        testName: testGenConfig.testCase.name,
-    });
+    if (testGenConfig.options?.agent !== "code") {
+        await new reporter_1.TestGenUpdatesReporter().reportGenAssets({
+            projectRepoName: testGenConfig.options.metadata.projectRepoName,
+            testName: testGenConfig.testCase.name,
+        });
+    }
     // TODO: move these reporters to a better lifecycle
     await (0, ci_1.reportOnCI)(testGenConfig.testCase);
     await (0, llm_1.flushAllTraces)();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@empiricalrun/test-gen",
-  "version": "0.31.10",
+  "version": "0.31.13",
   "publishConfig": {
     "registry": "https://registry.npmjs.org/",
     "access": "public"
@@ -44,9 +44,9 @@
     "ts-morph": "^23.0.0",
     "tsx": "^4.16.2",
     "typescript": "^5.3.3",
-    "@empiricalrun/llm": "^0.9.3",
     "@empiricalrun/r2-uploader": "^0.3.3",
-    "@empiricalrun/reporter": "^0.20.0"
+    "@empiricalrun/reporter": "^0.20.2",
+    "@empiricalrun/llm": "^0.9.3"
   },
   "devDependencies": {
     "@types/detect-port": "^1.3.5",