npm - @empiricalrun/test-gen - Versions diffs - 0.51.5 → 0.52.0 - Mend

@empiricalrun/test-gen 0.51.5 → 0.52.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (42)

package/CHANGELOG.md +30 -0
package/dist/agent/browsing/run.d.ts.map +1 -1
package/dist/agent/chat/index.d.ts +5 -0
package/dist/agent/chat/index.d.ts.map +1 -0
package/dist/agent/chat/index.js +129 -0
package/dist/agent/chat/prompt.d.ts +2 -0
package/dist/agent/chat/prompt.d.ts.map +1 -0
package/dist/agent/chat/prompt.js +74 -0
package/dist/agent/chat/repo.d.ts +2 -0
package/dist/agent/chat/repo.d.ts.map +1 -0
package/dist/agent/chat/repo.js +64 -0
package/dist/agent/cua/index.d.ts.map +1 -1
package/dist/agent/cua/index.js +10 -35
package/dist/agent/cua/model.d.ts +8 -0
package/dist/agent/cua/model.d.ts.map +1 -0
package/dist/agent/cua/model.js +35 -0
package/dist/bin/index.js +3 -2
package/dist/bin/logger/index.js +3 -3
package/dist/bin/utils/index.d.ts +1 -1
package/dist/bin/utils/index.d.ts.map +1 -1
package/dist/bin/utils/platform/web/index.d.ts +5 -0
package/dist/bin/utils/platform/web/index.d.ts.map +1 -1
package/dist/bin/utils/platform/web/index.js +13 -1
package/dist/reporter/index.d.ts +1 -1
package/dist/reporter/index.d.ts.map +1 -1
package/dist/reporter/index.js +8 -8
package/dist/reporter/lib.d.ts +31 -0
package/dist/reporter/lib.d.ts.map +1 -0
package/dist/reporter/lib.js +72 -0
package/dist/tools/test-gen-browser.d.ts.map +1 -1
package/dist/tools/test-gen-browser.js +7 -0
package/dist/uploader/index.d.ts.map +1 -1
package/dist/uploader/index.js +3 -3
package/dist/uploader/utils.d.ts +8 -0
package/dist/uploader/utils.d.ts.map +1 -0
package/dist/uploader/utils.js +35 -0
package/dist/utils/repo-tree.d.ts.map +1 -1
package/dist/utils/repo-tree.js +2 -0
package/package.json +4 -3
package/dist/agent/chat.d.ts +0 -5
package/dist/agent/chat.d.ts.map +0 -1
package/dist/agent/chat.js +0 -188

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,35 @@
 # @empiricalrun/test-gen
+## 0.52.0
+### Minor Changes
+- a399a57: feat: added Gemini support to chat agent
+### Patch Changes
+- 1b8d273: fix: clean up backup files
+- Updated dependencies [a399a57]
+- Updated dependencies [1b8d273]
+- Updated dependencies [99b0826]
+  - @empiricalrun/llm@0.12.0
+## 0.51.6
+### Patch Changes
+- dc17737: fix: repo context dir not found
+- b058de5: feat: add app knowledge to chat agent system prompt
+- dbe2ace: fix: remove Anthropic type from chat agent
+- ce7fece: fix: improvements to cua usage in test-gen-browser tool call
+- b8b4eff: fix: crash when last-chat is not found
+- af84555: chore: remove reporter dependency from test-gen package
+- 2766be8: feat: introduce chat model interface to support multiple llms
+- Updated dependencies [dbe2ace]
+- Updated dependencies [b8b4eff]
+- Updated dependencies [2766be8]
+  - @empiricalrun/llm@0.11.5
 ## 0.51.5
 ### Patch Changes

package/dist/agent/browsing/run.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"run.d.ts","sourceRoot":"","sources":["../../../src/agent/browsing/run.ts"],"names":[],"mappings":"AAiBA,KAAK,iBAAiB,GAAG;IACvB,YAAY,EAAE,MAAM,CAAC;IACrB,gBAAgB,EAAE,MAAM,CAAC;IACzB,gBAAgB,EAAE,MAAM,EAAE,CAAC;IAC3B,YAAY,EAAE,MAAM,CAAC;IACrB,OAAO,EAAE,MAAM,CAAC;CACjB,CAAC;AAEF,wBAAsB,6BAA6B,CAAC,EAClD,YAAY,EACZ,gBAAgB,EAChB,gBAAgB,EAChB,YAAY,EACZ,OAAO,GACR,EAAE,iBAAiB~~;;;GAgFnB~~"}
1	+ {"version":3,"file":"run.d.ts","sourceRoot":"","sources":["../../../src/agent/browsing/run.ts"],"names":[],"mappings":"AAiBA,KAAK,iBAAiB,GAAG;IACvB,YAAY,EAAE,MAAM,CAAC;IACrB,gBAAgB,EAAE,MAAM,CAAC;IACzB,gBAAgB,EAAE,MAAM,EAAE,CAAC;IAC3B,YAAY,EAAE,MAAM,CAAC;IACrB,OAAO,EAAE,MAAM,CAAC;CACjB,CAAC;AAEF,wBAAsB,6BAA6B,CAAC,EAClD,YAAY,EACZ,gBAAgB,EAChB,gBAAgB,EAChB,YAAY,EACZ,OAAO,GACR,EAAE,iBAAiB,GAAG,OAAO,CAAC;IAC7B,OAAO,EAAE,OAAO,CAAC;IACjB,KAAK,EAAE,MAAM,CAAC;CACf,CAAC,CAgFD"}

package/dist/agent/chat/index.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+export declare function chatAgent({ selectedModel, useDiskForChatState, }: {
+    selectedModel?: "claude-3-7-sonnet-20250219" | "claude-3-5-sonnet-20241022" | "gemini-2.5-pro-exp-03-25";
+    useDiskForChatState?: boolean;
+}): Promise<string>;
+//# sourceMappingURL=index.d.ts.map

package/dist/agent/chat/index.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/agent/chat/index.ts"],"names":[],"mappings":"AA4DA,wBAAsB,SAAS,CAAC,EAC9B,aAA4C,EAC5C,mBAA2B,GAC5B,EAAE;IACD,aAAa,CAAC,EACV,4BAA4B,GAC5B,4BAA4B,GAC5B,0BAA0B,CAAC;IAC/B,mBAAmB,CAAC,EAAE,OAAO,CAAC;CAC/B,mBA2FA"}

package/dist/agent/chat/index.js ADDED Viewed

@@ -0,0 +1,129 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.chatAgent = void 0;
+const chat_1 = require("@empiricalrun/llm/chat");
+const picocolors_1 = require("picocolors");
+const web_1 = require("../../bin/utils/platform/web");
+const human_in_the_loop_1 = require("../../human-in-the-loop");
+const diagnosis_fetcher_1 = require("../../tools/diagnosis-fetcher");
+const grep_1 = require("../../tools/grep");
+const test_gen_browser_1 = require("../../tools/test-gen-browser");
+const test_run_1 = require("../../tools/test-run");
+const test_run_fetcher_1 = require("../../tools/test-run-fetcher");
+const zod_schema_1 = require("../../tools/zod-schema");
+const prompt_1 = require("./prompt");
+const tools = [
+    test_run_1.runTestTool,
+    test_gen_browser_1.generateTestWithBrowserAgent,
+    diagnosis_fetcher_1.diagnosisTool,
+    grep_1.grepTool,
+    test_run_fetcher_1.testRunTool,
+];
+const toolExecutors = {
+    ...Object.fromEntries(tools.map((tool) => [tool.schema.name, tool.execute])),
+    str_replace_editor: (input) => (0, chat_1.strReplaceEditorTool)(input, web_1.validateTypescript),
+};
+function createChatModel(useDiskForChatState, selectedModel) {
+    if (selectedModel.startsWith("claude")) {
+        return new chat_1.ClaudeChatModel(useDiskForChatState);
+    }
+    if (selectedModel.startsWith("gemini")) {
+        return new chat_1.GeminiChatModel();
+    }
+    throw new Error(`Unsupported model: ${selectedModel}`);
+}
+function getModelName(model) {
+    if (model.startsWith("claude"))
+        return "Claude";
+    if (model.startsWith("gemini"))
+        return "Gemini";
+    return "AI";
+}
+function concludeAgent(usageSummary) {
+    console.log(`\n${(0, picocolors_1.gray)("Usage summary -> " + usageSummary)}`);
+    (0, chat_1.cleanupBackupFiles)(process.cwd());
+}
+async function chatAgent({ selectedModel = "claude-3-7-sonnet-20250219", useDiskForChatState = false, }) {
+    let chatModel = createChatModel(useDiskForChatState, selectedModel);
+    let userPrompt = undefined;
+    const handleSigInt = () => {
+        concludeAgent(chatModel.getUsageSummary());
+        process.exit(0);
+    };
+    process.once("SIGINT", handleSigInt);
+    process.once("SIGTERM", handleSigInt);
+    const ora = (await import("ora")).default;
+    if (chatModel.askUserForInput) {
+        // Show last message to the user for context when we loaded from disk
+        const latest = chatModel.getHumanReadableLatestMessage();
+        if (latest) {
+            console.log(`${latest.role}: ${latest.textMessage}`);
+        }
+    }
+    const systemPrompt = await (0, prompt_1.buildSystemPrompt)();
+    while (!userPrompt?.toLowerCase().includes("stop")) {
+        if (chatModel.askUserForInput) {
+            try {
+                userPrompt = await human_in_the_loop_1.humanLoop.getFeedback({
+                    message: "User:",
+                });
+            }
+            catch (e) {
+                // https://github.com/SBoudrias/Inquirer.js/issues/1502#issuecomment-2275991680
+                if (e instanceof Error && e.name === "ExitPromptError") {
+                    concludeAgent(chatModel.getUsageSummary());
+                    process.exit(0);
+                }
+                throw e;
+            }
+            chatModel.pushUserMessage(userPrompt);
+            continue;
+        }
+        const toolUse = chatModel.getPendingToolCall();
+        if (toolUse) {
+            const spinner = ora(`Executing tool ${toolUse.name} with args: ${JSON.stringify(toolUse.input)}`).start();
+            const toolExecutor = toolExecutors[toolUse.name];
+            if (!toolExecutor) {
+                throw new Error(`Tool ${toolUse.name} not found`);
+            }
+            const toolResult = await toolExecutor(toolUse.input);
+            if (toolResult.isError) {
+                spinner.fail(`Tool ${toolUse.name} failed with error: ${toolResult.result}`);
+            }
+            else {
+                spinner.succeed(`Tool ${toolUse.name} completed`);
+            }
+            chatModel.pushMessage({
+                role: "user",
+                content: [
+                    {
+                        type: "tool_result",
+                        tool_use_id: toolUse.id,
+                        content: toolResult.result,
+                        is_error: toolResult.isError,
+                    },
+                ],
+            });
+            continue;
+        }
+        const spinner = ora(`${getModelName(selectedModel)} is working...`).start();
+        const response = await chatModel.getLLMResponse({
+            systemPrompt,
+            tools: tools.map((tool) => (0, zod_schema_1.zodToOpenAITool)(tool.schema)),
+            selectedModel,
+        });
+        spinner.stop();
+        if (!response) {
+            throw new Error("No response from LLM");
+        }
+        chatModel.pushMessage(response);
+        const latest = chatModel.getHumanReadableLatestMessage();
+        if (latest) {
+            console.log(`${latest.role}: ${latest.textMessage}`);
+        }
+    }
+    const usageSummary = chatModel.getUsageSummary();
+    concludeAgent(usageSummary);
+    return usageSummary;
+}
+exports.chatAgent = chatAgent;

package/dist/agent/chat/prompt.d.ts ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ export declare function buildSystemPrompt(): Promise<string>;
2	+ //# sourceMappingURL=prompt.d.ts.map

package/dist/agent/chat/prompt.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"prompt.d.ts","sourceRoot":"","sources":["../../../src/agent/chat/prompt.ts"],"names":[],"mappings":"AAEA,wBAAsB,iBAAiB,oBAoEtC"}

package/dist/agent/chat/prompt.js ADDED Viewed

@@ -0,0 +1,74 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.buildSystemPrompt = void 0;
+const repo_1 = require("./repo");
+async function buildSystemPrompt() {
+    const repoContext = await (0, repo_1.getRepoContext)();
+    return `
+You are a helpful assistant that can answer questions and help with tasks related to writing
+and maintaining Playwright tests.
+# Supported capabilities
+- Adding new Playwright tests or helper methods
+- Going through test reports and identifying app issues versus test issues
+- Modifying existing tests
+- Modifying repo configuration (e.g. in playwright.config.ts and other)
+# Going through test reports
+- App issues: app issues caught by test failures, like UI issues, API endpoint issues, etc. These are issues that
+will be reported to an app developer to investigate and fix.
+- Test issues: Playwright tests can become outdated when app code changes. These are issues that need to be
+fixed with modifications to the test code, and it is your job to do that.
+# Tools
+You are given a set of tools to help you fulfill the user's request. Read their descriptions to
+understand what each tool does.
+For example, if the user asks you to run a test, you could use the runTest tool.
+Once the test is run, you will receive the results in the form of a JSON object.
+Summarize the results in a few sentences.
+If the user provides a diagnosis URL, you can use the fetchDiagnosisDetails tool
+to get more information about the test case and its results.
+If the user provides a test run URL, you can use the fetchTestRunDetails tool
+to get detailed information about a specific test run.
+Or if the user asks you to modify a test, you could use the generateTestWithBrowserAgent tool. If you suspect
+that a UI selector needs to be updated, using the browser agent is a good idea.
+Before using generateTestWithBrowserAgent, you need to prepare the test code for the browser agent.
+You can do this by using the str_replace_editor tool to add a TODO comment to the test code. This
+comment should explain to the browser agent what to do.
+For example, if the expected modification is to click on a login button, you could add the following comment.
+// TODO(agent): Click on the login button
+The position of the comment is important: the browser agent will look for this comment and replace it with
+the actual code to click on the login button. If you are fixing a failing test, your comment should be
+around the failing line of code, so that it can be replaced/modified.
+# Rules for fixing Playwright tests
+You must follow these rules while adding new tests or modifying existing tests. There can be exceptions to these rules, but
+ONLY when explicitly asked for by the user.
+1. Do not add any conditional logic or try catch blocks in a test. A good test deterministically tests a user scenario
+2. Trust Playwright's ability to auto-wait while taking actions on elements. For example, do not add checks on locator.isVisible() before clicking on it: Playwright already does this
+3. Do not add waitForTimeout or waitForLoadState in a test. Playwright will automatically wait for the page to load.
+4. You can't delete some steps from the test to make it pass. The test needs to accomplish its objective (which is to validate a particular user scenario)
+# Proactiveness
+You are allowed to be proactive, but ONLY for read-only actions, like searching for content, reading files, fetching data from tools, and
+running Playwright tests. For any read-write actions (e.g. modifying any file), you should share your plan and get the user's approval before proceeding.
+# Repo context
+${repoContext}
+`;
+}
+exports.buildSystemPrompt = buildSystemPrompt;

package/dist/agent/chat/repo.d.ts ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ export declare function getRepoContext(): Promise<string>;
2	+ //# sourceMappingURL=repo.d.ts.map

package/dist/agent/chat/repo.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"repo.d.ts","sourceRoot":"","sources":["../../../src/agent/chat/repo.ts"],"names":[],"mappings":"AAmCA,wBAAsB,cAAc,oBAwBnC"}

package/dist/agent/chat/repo.js ADDED Viewed

@@ -0,0 +1,64 @@
+"use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.getRepoContext = void 0;
+const fs_extra_1 = __importDefault(require("fs-extra"));
+const path_1 = __importDefault(require("path"));
+const repo_tree_1 = require("../../utils/repo-tree");
+async function getAllMarkdownFiles() {
+    const dir = path_1.default.join(process.cwd(), ".empiricalrun");
+    if (!fs_extra_1.default.existsSync(dir)) {
+        return [];
+    }
+    const files = await fs_extra_1.default.readdir(dir);
+    return files
+        .filter((file) => file.endsWith(".md"))
+        .map((file) => {
+        return {
+            name: file,
+            content: fs_extra_1.default.readFileSync(path_1.default.join(dir, file), "utf8"),
+        };
+    });
+}
+async function knowledgeContext() {
+    const mdFiles = await getAllMarkdownFiles();
+    const knowledge = mdFiles.map((file) => {
+        return `
+    <knowledge_file>
+    <file_name>${file.name}</file_name>
+    <file_content>
+    ${file.content}
+    </file_content>
+    </knowledge_file>
+    `;
+    });
+    return knowledge.join("\n");
+}
+async function getRepoContext() {
+    let REPO_CONTEXT_PROMPT = `
+You are running as a CLI tool inside the directory of the repo that has Playwright tests.
+Here is the repo directory structure:
+${(0, repo_tree_1.generateAsciiTree)(process.cwd())}
+While specifying paths to files, use relative paths from the current working directory. For example:
+- Correct path: "tests/lesson.spec.ts"
+- Incorrect path: "/repo/tests/lesson.spec.ts" or "${path_1.default.basename(process.cwd())}/tests/lesson.spec.ts"
+`;
+    const knowledge = await knowledgeContext();
+    if (knowledge.length > 0) {
+        REPO_CONTEXT_PROMPT += `
+## Repo-specific knowledge
+You can use the following knowledge with your tasks.
+<knowledge>
+${knowledge}
+</knowledge>
+`;
+    }
+    return REPO_CONTEXT_PROMPT;
+}
+exports.getRepoContext = getRepoContext;

package/dist/agent/cua/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/agent/cua/index.ts"],"names":[],"mappings":"~~AAEA~~,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;~~AAWlC~~,wBAAsB,sBAAsB,CAAC,IAAI,EAAE,IAAI,iBAoBtD;AAED;;GAEG;AACH,wBAAsB,+BAA+B,CAAC,EACpD,IAAI,EACJ,IAAI,GACL,EAAE;IACD,IAAI,EAAE,IAAI,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;CACd,GAAG,OAAO,CAAC;IACV,IAAI,EAAE,MAAM,CAAC;IACb,WAAW,EAAE,MAAM,EAAE,CAAC;CACvB,CAAC,~~CAmGD~~"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/agent/cua/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,IAAI,EAAE,MAAM,YAAY,CAAC;AAMlC,wBAAsB,sBAAsB,CAAC,IAAI,EAAE,IAAI,iBAoBtD;AAED;;GAEG;AACH,wBAAsB,+BAA+B,CAAC,EACpD,IAAI,EACJ,IAAI,GACL,EAAE;IACD,IAAI,EAAE,IAAI,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;CACd,GAAG,OAAO,CAAC;IACV,IAAI,EAAE,MAAM,CAAC;IACb,WAAW,EAAE,MAAM,EAAE,CAAC;CACvB,CAAC,CAkFD"}

package/dist/agent/cua/index.js CHANGED Viewed

@@ -1,17 +1,9 @@
 "use strict";
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
-};
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.createTestUsingComputerUseAgent = exports.startPlaywrightCodegen = void 0;
-const openai_1 = __importDefault(require("openai"));
 const utils_1 = require("../browsing/utils");
 const computer_1 = require("./computer");
-const INSTRUCTIONS = `You will be asked to execute some actions in a browser context.
-Don't ask the user for confirmations - just execute the actions.
-For example, if the user message says "Click on Submit button", then
-you click on the submit button -- even if it looks like a scary action.`;
+const model_1 = require("./model");
 async function startPlaywrightCodegen(page) {
     // TODO: Use this method to offload code generation to Playwright
     // Unclear how to retrieve source code that is generated
@@ -44,18 +36,7 @@ async function createTestUsingComputerUseAgent({ page, task, }) {
     const viewport = page.viewportSize();
     let screenWidth = viewport?.width || 1280;
     let screenHeight = viewport?.height || 720;
-    const openai = new openai_1.default();
-    let response = await openai.responses.create({
-        model: "computer-use-preview",
-        tools: [
-            {
-                type: "computer-preview",
-                display_width: screenWidth,
-                display_height: screenHeight,
-                environment: "browser",
-            },
-        ],
-        instructions: INSTRUCTIONS,
+    let response = await (0, model_1.callComputerUseModel)({
         input: [
             {
                 role: "user",
@@ -72,7 +53,8 @@ async function createTestUsingComputerUseAgent({ page, task, }) {
                 ],
             },
         ],
-        truncation: "auto",
+        screenWidth,
+        screenHeight,
     });
     // eslint-disable-next-line no-constant-condition
     while (true) {
@@ -92,6 +74,7 @@ async function createTestUsingComputerUseAgent({ page, task, }) {
         const computerCall = computerCalls[0];
         const lastCallId = computerCall.call_id;
         const action = computerCall.action;
+        const pendingSafetyChecks = computerCall.pending_safety_checks;
         // Execute the action (function defined in step 3)
         const actionCode = await (0, computer_1.handleModelAction)(page, action);
         generatedCode += actionCode;
@@ -99,18 +82,8 @@ async function createTestUsingComputerUseAgent({ page, task, }) {
         // Take a screenshot after the action (function defined in step 4)
         const screenshotBytes = await (0, computer_1.getScreenshot)(page);
         // Send the screenshot back as a computer_call_output
-        response = await openai.responses.create({
-            model: "computer-use-preview",
-            previous_response_id: response.id,
-            tools: [
-                {
-                    type: "computer-preview",
-                    display_width: screenWidth,
-                    display_height: screenHeight,
-                    environment: "browser",
-                },
-            ],
-            instructions: INSTRUCTIONS,
+        response = await (0, model_1.callComputerUseModel)({
+            previousResponseId: response.id,
             input: [
                 {
                     call_id: lastCallId,
@@ -119,9 +92,11 @@ async function createTestUsingComputerUseAgent({ page, task, }) {
                         type: "computer_screenshot",
                         image_url: `data:image/png;base64,${screenshotBytes}`,
                     },
+                    acknowledged_safety_checks: pendingSafetyChecks,
                 },
             ],
-            truncation: "auto",
+            screenWidth,
+            screenHeight,
         });
     }
     return {

package/dist/agent/cua/model.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+import { Response, ResponseInput } from "openai/resources/responses/responses.mjs";
+export declare function callComputerUseModel({ input, previousResponseId, screenWidth, screenHeight, }: {
+    input: ResponseInput;
+    previousResponseId?: string;
+    screenWidth: number;
+    screenHeight: number;
+}): Promise<Response>;
+//# sourceMappingURL=model.d.ts.map

package/dist/agent/cua/model.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"model.d.ts","sourceRoot":"","sources":["../../../src/agent/cua/model.ts"],"names":[],"mappings":"AACA,OAAO,EACL,QAAQ,EACR,aAAa,EACd,MAAM,0CAA0C,CAAC;AAQlD,wBAAsB,oBAAoB,CAAC,EACzC,KAAK,EACL,kBAAkB,EAClB,WAAW,EACX,YAAY,GACb,EAAE;IACD,KAAK,EAAE,aAAa,CAAC;IACrB,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;CACtB,GAAG,OAAO,CAAC,QAAQ,CAAC,CAqBpB"}

package/dist/agent/cua/model.js ADDED Viewed

@@ -0,0 +1,35 @@
+"use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.callComputerUseModel = void 0;
+const openai_1 = __importDefault(require("openai"));
+const INSTRUCTIONS = `You will be asked to execute some actions in a browser context.
+Don't ask the user for confirmations - just execute the actions.
+For example, if the user message says "Click on Submit button", then
+you click on the submit button -- even if it looks like a scary action.`;
+async function callComputerUseModel({ input, previousResponseId, screenWidth, screenHeight, }) {
+    const openai = new openai_1.default();
+    return await openai.responses.create({
+        model: "computer-use-preview",
+        previous_response_id: previousResponseId,
+        tools: [
+            {
+                type: "computer-preview",
+                display_width: screenWidth,
+                display_height: screenHeight,
+                environment: "browser",
+            },
+        ],
+        reasoning: {
+            effort: "medium",
+            generate_summary: "concise",
+        },
+        instructions: INSTRUCTIONS,
+        input,
+        truncation: "auto",
+    });
+}
+exports.callComputerUseModel = callComputerUseModel;

package/dist/bin/index.js CHANGED Viewed

@@ -41,12 +41,13 @@ async function runChatAgent(modelInput, useDiskForChatState) {
         "3-7": "claude-3-7-sonnet-20250219",
         "claude-3-5": "claude-3-5-sonnet-20241022",
         "3-5": "claude-3-5-sonnet-20241022",
+        "gemini-2.5-pro-exp-03-25": "gemini-2.5-pro-exp-03-25",
     };
     if (modelInput && !MODEL_MAPPING[modelInput]) {
         throw new Error(`Invalid chat model: ${modelInput}`);
     }
     return await (0, chat_1.chatAgent)({
-        chatModel: modelInput ? MODEL_MAPPING[modelInput] : undefined,
+        selectedModel: modelInput ? MODEL_MAPPING[modelInput] : undefined,
         useDiskForChatState,
     });
 }
@@ -186,7 +187,7 @@ async function runAgentsWorkflow(testGenConfig, testGenToken) {
         .option("--suites <suites>", "Comma separated list of describe blocks")
         .option("--use-chat", "Use chat agent (and not the workflow)")
         .option("--use-disk-for-chat-state", "Save and load chat state from disk")
-        .option("--chat-model <model>", "Chat model to use (claude-3-7-sonnet-20250219 or claude-3-5-sonnet-20241022)")
+        .option("--chat-model <model>", "Chat model to use (claude-3-7-sonnet-20250219 or claude-3-5-sonnet-20241022 or gemini-2.5-pro-exp-03-25)")
         .parse(process.argv);
     const options = program.opts();
     const completedOptions = await (0, utils_2.validateAndCompleteCliOptions)(options);

package/dist/bin/logger/index.js CHANGED Viewed

@@ -1,9 +1,9 @@
 "use strict";
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.waitForLogsToFlush = exports.CustomLogger = void 0;
-const reporter_1 = require("@empiricalrun/reporter");
 const picocolors_1 = require("picocolors");
-const reporter_2 = require("../../reporter");
+const reporter_1 = require("../../reporter");
+const lib_1 = require("../../reporter/lib");
 let queuedReporterMessages = [];
 class CustomLogger {
     useReporter = false;
@@ -13,7 +13,7 @@ class CustomLogger {
     logToReporter(message) {
         if (this.useReporter) {
             (() => {
-                const promise = (0, reporter_2.getReporter)()?.report(new reporter_1.ProcessLogMessageBuilder({ type: "message", message: message }));
+                const promise = (0, reporter_1.getReporter)()?.report(new lib_1.MessageBuilder({ type: "message", message: message }));
                 if (promise) {
                     queuedReporterMessages.push(promise);
                 }

package/dist/bin/utils/index.d.ts CHANGED Viewed

@@ -6,7 +6,7 @@ export interface CliOptions {
     suites?: string;
     useChat?: boolean;
     useDiskForChatState?: boolean;
-    chatModel?: "claude-3-7" | "3-7" | "claude-3-5" | "3-5" | "claude-3-7-sonnet-20250219" | "claude-3-5-sonnet-20241022";
+    chatModel?: "claude-3-7" | "3-7" | "claude-3-5" | "3-5" | "claude-3-7-sonnet-20250219" | "claude-3-5-sonnet-20241022" | "gemini-2.5-pro-exp-03-25";
 }
 export declare function validateAndCompleteCliOptions(options: CliOptions): Promise<CliOptions>;
 //# sourceMappingURL=index.d.ts.map

package/dist/bin/utils/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/bin/utils/index.ts"],"names":[],"mappings":"AAEA,MAAM,WAAW,UAAU;IACzB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB,mBAAmB,CAAC,EAAE,OAAO,CAAC;IAC9B,SAAS,CAAC,EACN,YAAY,GACZ,KAAK,GACL,YAAY,GACZ,KAAK,GACL,4BAA4B,GAC5B,4BAA4B,CAAC;~~CAClC~~;AAQD,wBAAsB,6BAA6B,CACjD,OAAO,EAAE,UAAU,GAClB,OAAO,CAAC,UAAU,CAAC,CAyDrB"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/bin/utils/index.ts"],"names":[],"mappings":"AAEA,MAAM,WAAW,UAAU;IACzB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB,mBAAmB,CAAC,EAAE,OAAO,CAAC;IAC9B,SAAS,CAAC,EACN,YAAY,GACZ,KAAK,GACL,YAAY,GACZ,KAAK,GACL,4BAA4B,GAC5B,4BAA4B,GAC5B,0BAA0B,CAAC;CAChC;AAQD,wBAAsB,6BAA6B,CACjD,OAAO,EAAE,UAAU,GAClB,OAAO,CAAC,UAAU,CAAC,CAyDrB"}

package/dist/bin/utils/platform/web/index.d.ts CHANGED Viewed

@@ -18,6 +18,11 @@ export declare function getTypescriptTestBlock({ scenarioName, suites, content,
     testNode: Node | undefined;
     testAlias: string;
 };
+export declare function hasTestBlock({ testName, testSuites, filePath, }: {
+    testName: string;
+    testSuites: string[];
+    filePath: string;
+}): boolean;
 export declare function hasTopLevelDescribeConfigureWithSerialMode(filePath: string): Promise<boolean>;
 /**
  * Function to find the first 'describe' block configured with 'serial: true'

package/dist/bin/utils/platform/web/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../../../src/bin/utils/platform/web/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AAChD,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,4BAA4B,CAAC;AAK3D,OAAO,EAGL,IAAI,EAEJ,UAAU,EAEX,MAAM,UAAU,CAAC;AAIlB,eAAO,MAAM,gCAAgC,eAC/B,UAAU,KACrB,MAgBF,CAAC;AAEF;;;;;;GAMG;AACH,wBAAgB,sBAAsB,CAAC,EACrC,YAAY,EACZ,MAAM,EACN,OAAO,GACR,EAAE;IACD,YAAY,EAAE,MAAM,CAAC;IACrB,MAAM,CAAC,EAAE,MAAM,EAAE,CAAC;IAClB,OAAO,EAAE,MAAM,CAAC;CACjB,GAAG;IACF,SAAS,EAAE,MAAM,GAAG,SAAS,CAAC;IAC9B,QAAQ,EAAE,IAAI,GAAG,SAAS,CAAC;IAC3B,SAAS,EAAE,MAAM,CAAC;CACnB,CA2CA;AAwBD,wBAAsB,0CAA0C,CAC9D,QAAQ,EAAE,MAAM,oBA+BjB;AAED;;;;;;;;;;;;;;;;;;;;;;GAsBG;AACH,wBAAgB,4BAA4B,CAC1C,IAAI,EAAE,IAAI,GAAG,SAAS,GACrB,IAAI,GAAG,SAAS,CA4BlB;AAED,wBAAgB,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,MAAM,CAG5E;AAED,wBAAgB,kBAAkB,CAAC,QAAQ,EAAE,MAAM,GAAG,MAAM,EAAE,CA8C7D;AAED,wBAAsB,sBAAsB,CAC1C,OAAO,EAAE,MAAM,EACf,QAAQ,EAAE,MAAM,mCAWjB;AAED,wBAAsB,UAAU,CAAC,QAAQ,EAAE,MAAM,iBAShD;AAED,wBAAsB,UAAU,CAAC,QAAQ,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,WAAW,iBAgBrE;AAED,wBAAgB,YAAY,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,MAAM,UAE5E;AAED,wBAAsB,cAAc,CAAC,QAAQ,EAAE,MAAM,iBAMpD;AAED,wBAAgB,oBAAoB,CAAC,QAAQ,EAAE,MAAM,UAcpD;AAED,wBAAsB,iCAAiC,CAAC,QAAQ,EAAE,MAAM,+BAoBvE;AA+CD,wBAAgB,4BAA4B,CAC1C,QAAQ,EAAE,MAAM,EAChB,QAAQ,EAAE,MAAM,EAChB,aAAa,EAAE,MAAM,UAoCtB;AAED,eAAO,MAAM,6BAA6B;qBAKvB,MAAM;iBACV,MAAM;YACX,MAAM,EAAE;YA2DjB,CAAC;AAEF,eAAO,MAAM,iCAAiC,YACnC,MAAM,aACJ,MAAM,EAAE,gBACL,MAAM,sBAyBrB,CAAC;AAEF,wBAAsB,qBAAqB,CAAC,EAC1C,YAAY,EACZ,QAAQ,EACR,MAAM,GACP,EAAE;IACD,YAAY,EAAE,MAAM,CAAC;IACrB,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB,iBAgDA;AAED,wBAAsB,uBAAuB,CAC3C,QAAQ,EAAE,MAAM,EAChB,cAAc,EAAE,MAAM,EAAE,iBAsBzB;AAED,wBAAgB,aAAa,CAAC,EAC5B,QAAQ,EACR,QAAQ,GACT,EAAE;IACD,QAAQ,EAAE,MAAM,CAAC;IACjB,QAAQ,EAAE,QAAQ,CAAC;CACpB,WAYA;AAED,wBAAgB,mBAAmB,CAAC,EAClC,QAAQ,EACR,MAAM,GACP,EAAE;IACD,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,EAAE,M
AAM,EAAE,CAAC;CAClB,UAOA;AAED,wBAAgB,+BAA+B,CAAC,UAAU,EAAE,MAAM,GAAG,MAAM,EAAE,CA4B5E;AAED,wBAAgB,aAAa,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAQnD"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../../../src/bin/utils/platform/web/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AAChD,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,4BAA4B,CAAC;AAK3D,OAAO,EAGL,IAAI,EAEJ,UAAU,EAEX,MAAM,UAAU,CAAC;AAIlB,eAAO,MAAM,gCAAgC,eAC/B,UAAU,KACrB,MAgBF,CAAC;AAEF;;;;;;GAMG;AACH,wBAAgB,sBAAsB,CAAC,EACrC,YAAY,EACZ,MAAM,EACN,OAAO,GACR,EAAE;IACD,YAAY,EAAE,MAAM,CAAC;IACrB,MAAM,CAAC,EAAE,MAAM,EAAE,CAAC;IAClB,OAAO,EAAE,MAAM,CAAC;CACjB,GAAG;IACF,SAAS,EAAE,MAAM,GAAG,SAAS,CAAC;IAC9B,QAAQ,EAAE,IAAI,GAAG,SAAS,CAAC;IAC3B,SAAS,EAAE,MAAM,CAAC;CACnB,CA2CA;AAED,wBAAgB,YAAY,CAAC,EAC3B,QAAQ,EACR,UAAU,EACV,QAAQ,GACT,EAAE;IACD,QAAQ,EAAE,MAAM,CAAC;IACjB,UAAU,EAAE,MAAM,EAAE,CAAC;IACrB,QAAQ,EAAE,MAAM,CAAC;CAClB,WAUA;AAwBD,wBAAsB,0CAA0C,CAC9D,QAAQ,EAAE,MAAM,oBA+BjB;AAED;;;;;;;;;;;;;;;;;;;;;;GAsBG;AACH,wBAAgB,4BAA4B,CAC1C,IAAI,EAAE,IAAI,GAAG,SAAS,GACrB,IAAI,GAAG,SAAS,CA4BlB;AAED,wBAAgB,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,MAAM,CAG5E;AAED,wBAAgB,kBAAkB,CAAC,QAAQ,EAAE,MAAM,GAAG,MAAM,EAAE,CA8C7D;AAED,wBAAsB,sBAAsB,CAC1C,OAAO,EAAE,MAAM,EACf,QAAQ,EAAE,MAAM,mCAWjB;AAED,wBAAsB,UAAU,CAAC,QAAQ,EAAE,MAAM,iBAShD;AAED,wBAAsB,UAAU,CAAC,QAAQ,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,WAAW,iBAgBrE;AAED,wBAAgB,YAAY,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,MAAM,UAE5E;AAED,wBAAsB,cAAc,CAAC,QAAQ,EAAE,MAAM,iBAMpD;AAED,wBAAgB,oBAAoB,CAAC,QAAQ,EAAE,MAAM,UAcpD;AAED,wBAAsB,iCAAiC,CAAC,QAAQ,EAAE,MAAM,+BAoBvE;AA+CD,wBAAgB,4BAA4B,CAC1C,QAAQ,EAAE,MAAM,EAChB,QAAQ,EAAE,MAAM,EAChB,aAAa,EAAE,MAAM,UAoCtB;AAED,eAAO,MAAM,6BAA6B;qBAKvB,MAAM;iBACV,MAAM;YACX,MAAM,EAAE;YA2DjB,CAAC;AAEF,eAAO,MAAM,iCAAiC,YACnC,MAAM,aACJ,MAAM,EAAE,gBACL,MAAM,sBAyBrB,CAAC;AAEF,wBAAsB,qBAAqB,CAAC,EAC1C,YAAY,EACZ,QAAQ,EACR,MAAM,GACP,EAAE;IACD,YAAY,EAAE,MAAM,CAAC;IACrB,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB,iBAgDA;AAED,wBAAsB,uBAAuB,CAC3C,QAAQ,EAAE,MAAM,EAChB,cAAc,EAAE,MAAM,EAAE,iBAsBzB;AAED,wBAAgB,aAAa,CAAC,EAC5B,QAAQ,EACR,QAAQ,GACT,EAAE;IAC
D,QAAQ,EAAE,MAAM,CAAC;IACjB,QAAQ,EAAE,QAAQ,CAAC;CACpB,WAYA;AAED,wBAAgB,mBAAmB,CAAC,EAClC,QAAQ,EACR,MAAM,GACP,EAAE;IACD,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB,UAOA;AAED,wBAAgB,+BAA+B,CAAC,UAAU,EAAE,MAAM,GAAG,MAAM,EAAE,CA4B5E;AAED,wBAAgB,aAAa,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAQnD"}

package/dist/bin/utils/platform/web/index.js CHANGED Viewed

@@ -3,7 +3,7 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
     return (mod && mod.__esModule) ? mod : { "default": mod };
 };
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.isSyntaxValid = exports.getVariableDeclarationsFromCode = exports.buildTestNamePrompt = exports.isTestPresent = exports.appendScopeToCreateTest = exports.addUserContextFixture = exports.importAllExportsStmtFromFilePaths = exports.injectCodeSnippetBySuiteChain = exports.replaceCreateTestWithNewCode = exports.getPageVariableNameFromCreateTest = exports.getFixtureImportPath = exports.removeTestOnly = exports.addNewImport = exports.formatCode = exports.lintErrors = exports.stripAndPrependImports = exports.validateTypescript = exports.appendToTestBlock = exports.findFirstSerialDescribeBlock = exports.hasTopLevelDescribeConfigureWithSerialMode = exports.getTypescriptTestBlock = exports.getTestModuleAliasFromSourceFile = void 0;
+exports.isSyntaxValid = exports.getVariableDeclarationsFromCode = exports.buildTestNamePrompt = exports.isTestPresent = exports.appendScopeToCreateTest = exports.addUserContextFixture = exports.importAllExportsStmtFromFilePaths = exports.injectCodeSnippetBySuiteChain = exports.replaceCreateTestWithNewCode = exports.getPageVariableNameFromCreateTest = exports.getFixtureImportPath = exports.removeTestOnly = exports.addNewImport = exports.formatCode = exports.lintErrors = exports.stripAndPrependImports = exports.validateTypescript = exports.appendToTestBlock = exports.findFirstSerialDescribeBlock = exports.hasTopLevelDescribeConfigureWithSerialMode = exports.hasTestBlock = exports.getTypescriptTestBlock = exports.getTestModuleAliasFromSourceFile = void 0;
 const parser_1 = require("@babel/parser");
 const eslint_1 = require("eslint");
 const fs_extra_1 = __importDefault(require("fs-extra"));
@@ -72,6 +72,18 @@ function getTypescriptTestBlock({ scenarioName, suites, content, }) {
     };
 }
 exports.getTypescriptTestBlock = getTypescriptTestBlock;
+function hasTestBlock({ testName, testSuites, filePath, }) {
+    if (!fs_extra_1.default.existsSync(filePath)) {
+        return false;
+    }
+    const { testBlock } = getTypescriptTestBlock({
+        scenarioName: testName,
+        content: fs_extra_1.default.readFileSync(filePath, "utf-8"),
+        suites: testSuites,
+    });
+    return Boolean(testBlock);
+}
+exports.hasTestBlock = hasTestBlock;
 // get the names of parent describe blocks
 function getParentDescribeNames(node) {
     const names = [];

package/dist/reporter/index.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { Reporter } from "@empiricalrun/reporter";
+import { Reporter } from "./lib";
 type ReporterConfigType = {
     testSessionId: number;
     generationId: number;

package/dist/reporter/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/reporter/index.ts"],"names":[],"mappings":"~~AACA~~,OAAO,~~EAA4B~~,QAAQ,EAAE,MAAM,~~wBAAwB~~,CAAC;~~AAa5E~~,KAAK,kBAAkB,GAAG;IACxB,aAAa,EAAE,MAAM,CAAC;IACtB,YAAY,EAAE,MAAM,CAAC;IACrB,eAAe,EAAE,MAAM,CAAC;CACzB,CAAC;AAKF,wBAAgB,WAAW,IAAI,QAAQ,GAAG,SAAS,CAUlD;AAED;;;GAGG;AACH,wBAAgB,iBAAiB,CAAC,MAAM,EAAE,kBAAkB,GAAG,IAAI,CAGlE;AAED,qBAAa,sBAAsB;IACjC,OAAO,CAAC,OAAO,CAAS;;IAKlB,eAAe,CAAC,EACpB,eAAe,EACf,QAAQ,GACT,EAAE;QACD,eAAe,EAAE,MAAM,CAAC;QACxB,QAAQ,EAAE,MAAM,CAAC;KAClB;IAgDK,eAAe,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IA8C9C,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAY3C,UAAU,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAY1C,iBAAiB,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;CAWxD"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/reporter/index.ts"],"names":[],"mappings":"AAYA,OAAO,EAAkB,QAAQ,EAAE,MAAM,OAAO,CAAC;AAEjD,KAAK,kBAAkB,GAAG;IACxB,aAAa,EAAE,MAAM,CAAC;IACtB,YAAY,EAAE,MAAM,CAAC;IACrB,eAAe,EAAE,MAAM,CAAC;CACzB,CAAC;AAKF,wBAAgB,WAAW,IAAI,QAAQ,GAAG,SAAS,CAUlD;AAED;;;GAGG;AACH,wBAAgB,iBAAiB,CAAC,MAAM,EAAE,kBAAkB,GAAG,IAAI,CAGlE;AAED,qBAAa,sBAAsB;IACjC,OAAO,CAAC,OAAO,CAAS;;IAKlB,eAAe,CAAC,EACpB,eAAe,EACf,QAAQ,GACT,EAAE;QACD,eAAe,EAAE,MAAM,CAAC;QACxB,QAAQ,EAAE,MAAM,CAAC;KAClB;IAgDK,eAAe,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IA8C9C,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAY3C,UAAU,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAY1C,iBAAiB,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;CAWxD"}

package/dist/reporter/index.js CHANGED Viewed

@@ -5,11 +5,11 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.TestGenUpdatesReporter = exports.setReporterConfig = exports.getReporter = void 0;
 const r2_uploader_1 = require("@empiricalrun/r2-uploader");
-const reporter_1 = require("@empiricalrun/reporter");
 const fs_extra_1 = __importDefault(require("fs-extra"));
 const path_1 = __importDefault(require("path"));
 const logger_1 = require("../bin/logger");
 const uploader_1 = require("../uploader");
+const lib_1 = require("./lib");
 let reporterInstance = undefined;
 let reporterConfig = undefined;
 function getReporter() {
@@ -19,7 +19,7 @@ function getReporter() {
     }
     // initialise once config is set
     if (!reporterInstance && reporterConfig) {
-        reporterInstance = new reporter_1.Reporter(reporterConfig);
+        reporterInstance = new lib_1.Reporter(reporterConfig);
     }
     return reporterInstance;
 }
@@ -55,7 +55,7 @@ class TestGenUpdatesReporter {
             await Promise.allSettled([
                 ...(videoUrls.length
                     ? [
-                        reporter?.report(new reporter_1.ProcessLogMessageBuilder({
+                        reporter?.report(new lib_1.MessageBuilder({
                             type: "video",
                             message: JSON.stringify({
                                 type: "video",
@@ -66,7 +66,7 @@ class TestGenUpdatesReporter {
                     : []),
                 ...(traceFiles.length
                     ? [
-                        reporter?.report(new reporter_1.ProcessLogMessageBuilder({
+                        reporter?.report(new lib_1.MessageBuilder({
                             type: "pw-trace",
                             message: JSON.stringify({
                                 type: "trace",
@@ -107,7 +107,7 @@ class TestGenUpdatesReporter {
             const filePath = Object.keys(files)[0];
             const relativeFilePath = filePath.replace(path_1.default.join(this.repoDir, "gen-assets"), "");
             const url = `${uploader_1.UPLOAD_DOMAIN}/${uploadDir}${relativeFilePath}`;
-            await getReporter()?.report(new reporter_1.ProcessLogMessageBuilder({
+            await getReporter()?.report(new lib_1.MessageBuilder({
                 type: "current-snapshot",
                 message: JSON.stringify({ type: "current-view", url }),
             }));
@@ -122,7 +122,7 @@ class TestGenUpdatesReporter {
     async sendMessage(message) {
         const reporter = getReporter();
         if (reporter) {
-            await reporter.report(new reporter_1.ProcessLogMessageBuilder({
+            await reporter.report(new lib_1.MessageBuilder({
                 type: "message",
                 message,
             }));
@@ -131,7 +131,7 @@ class TestGenUpdatesReporter {
     async sendLogUrl(message) {
         const reporter = getReporter();
         if (reporter) {
-            await reporter.report(new reporter_1.ProcessLogMessageBuilder({
+            await reporter.report(new lib_1.MessageBuilder({
                 type: "log-url",
                 message,
             }));
@@ -140,7 +140,7 @@ class TestGenUpdatesReporter {
     async sendAgentTraceUrl(message) {
         const reporter = getReporter();
         if (reporter) {
-            await reporter.report(new reporter_1.ProcessLogMessageBuilder({
+            await reporter.report(new lib_1.MessageBuilder({
                 type: "agent-trace",
                 message,
             }));

package/dist/reporter/lib.d.ts ADDED Viewed

@@ -0,0 +1,31 @@
+type DashboardMessagePayload = {
+    message: string;
+    messageType: "message" | "agent-trace" | "current-snapshot" | "video" | "pw-trace" | "log-url" | "commit-id";
+    pull_request?: string;
+    testCaseName?: string;
+    testCaseId?: number;
+    projectRepoName?: string;
+    testSessionId?: number;
+    generationId?: number;
+};
+export declare class MessageBuilder {
+    private props;
+    constructor(props: {
+        message: string;
+        type: DashboardMessagePayload["messageType"];
+    });
+    buildMessage(dashboardOptions?: {
+        override?: Partial<DashboardMessagePayload>;
+    }): DashboardMessagePayload;
+}
+export declare class Reporter {
+    private config;
+    constructor(config: {
+        testSessionId: number;
+        generationId: number;
+    });
+    report(messageBuilder: MessageBuilder): Promise<void>;
+    private sendMessageToDashboard;
+}
+export {};
+//# sourceMappingURL=lib.d.ts.map

package/dist/reporter/lib.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"lib.d.ts","sourceRoot":"","sources":["../../src/reporter/lib.ts"],"names":[],"mappings":"AAMA,KAAK,uBAAuB,GAAG;IAC7B,OAAO,EAAE,MAAM,CAAC;IAChB,WAAW,EACP,SAAS,GACT,aAAa,GACb,kBAAkB,GAClB,OAAO,GACP,UAAU,GACV,SAAS,GACT,WAAW,CAAC;IAChB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,YAAY,CAAC,EAAE,MAAM,CAAC;CACvB,CAAC;AAEF,qBAAa,cAAc;IAEvB,OAAO,CAAC,KAAK;gBAAL,KAAK,EAAE;QACb,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,uBAAuB,CAAC,aAAa,CAAC,CAAC;KAC9C;IAGH,YAAY,CAAC,gBAAgB,CAAC,EAAE;QAC9B,QAAQ,CAAC,EAAE,OAAO,CAAC,uBAAuB,CAAC,CAAC;KAC7C,GAAG,uBAAuB;CAO5B;AAED,qBAAa,QAAQ;IAEjB,OAAO,CAAC,MAAM;gBAAN,MAAM,EAAE;QACd,aAAa,EAAE,MAAM,CAAC;QACtB,YAAY,EAAE,MAAM,CAAC;KACtB;IAGG,MAAM,CAAC,cAAc,EAAE,cAAc,GAAG,OAAO,CAAC,IAAI,CAAC;YAc7C,sBAAsB;CAmCrC"}

package/dist/reporter/lib.js ADDED Viewed

@@ -0,0 +1,72 @@
+"use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.Reporter = exports.MessageBuilder = void 0;
+const async_retry_1 = __importDefault(require("async-retry"));
+const DASHBOARD_DOMAIN = process.env.DASHBOARD_DOMAIN ||
+    (process.env.CI === "true" ? "https://dash.empirical.run" : "");
+class MessageBuilder {
+    props;
+    constructor(props) {
+        this.props = props;
+    }
+    buildMessage(dashboardOptions) {
+        return {
+            ...dashboardOptions?.override,
+            message: this.props.message,
+            messageType: this.props.type,
+        };
+    }
+}
+exports.MessageBuilder = MessageBuilder;
+class Reporter {
+    config;
+    constructor(config) {
+        this.config = config;
+    }
+    async report(messageBuilder) {
+        const message = messageBuilder.buildMessage({
+            override: {
+                testSessionId: this.config.testSessionId,
+                generationId: this.config.generationId,
+            },
+        });
+        if (!message) {
+            console.info("No message found. Skipping sending message to dashboard");
+            return;
+        }
+        await this.sendMessageToDashboard(message);
+    }
+    async sendMessageToDashboard(message) {
+        if (!DASHBOARD_DOMAIN) {
+            console.warn("No dashboard domain found. Skipping send message to dashboard");
+            return;
+        }
+        try {
+            await (0, async_retry_1.default)(async () => {
+                const body = JSON.stringify(message);
+                await fetch(`${DASHBOARD_DOMAIN}/api/github/updates`, {
+                    method: "POST",
+                    headers: {
+                        "Content-Type": "application/json",
+                        // TODO: fix this with authentication of github updates api
+                        Authorization: "weQPMWKT",
+                    },
+                    body,
+                });
+            }, {
+                retries: 3,
+                minTimeout: 1000,
+                maxTimeout: 60000,
+                factor: 3,
+            });
+        }
+        catch (e) {
+            console.error(`Error sending message to Dashboard: ${e.code}`);
+            console.error(e.message);
+        }
+    }
+}
+exports.Reporter = Reporter;

package/dist/tools/test-gen-browser.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"test-gen-browser.d.ts","sourceRoot":"","sources":["../../src/tools/test-gen-browser.ts"],"names":[],"mappings":"~~AAUA~~,OAAO,KAAK,EAAE,IAAI,EAAE,MAAM,SAAS,CAAC;AAmDpC,eAAO,MAAM,4BAA4B,EAAE,~~IAiE1C~~,CAAC"}
1	+ {"version":3,"file":"test-gen-browser.d.ts","sourceRoot":"","sources":["../../src/tools/test-gen-browser.ts"],"names":[],"mappings":"AAWA,OAAO,KAAK,EAAE,IAAI,EAAE,MAAM,SAAS,CAAC;AAmDpC,eAAO,MAAM,4BAA4B,EAAE,IAuE1C,CAAC"}

package/dist/tools/test-gen-browser.js CHANGED Viewed

@@ -4,6 +4,7 @@ exports.generateTestWithBrowserAgent = void 0;
 const zod_1 = require("zod");
 const run_1 = require("../agent/browsing/run");
 const utils_1 = require("../agent/browsing/utils");
+const web_1 = require("../bin/utils/platform/web");
 const scenarios_1 = require("../bin/utils/scenarios");
 const git_1 = require("../utils/git");
 const BrowserAgentSchema = zod_1.z.object({
@@ -65,6 +66,12 @@ exports.generateTestWithBrowserAgent = {
                 result: `Invalid project name: ${project}. Valid project names are: ${validProjectNames.join(", ")}`,
             };
         }
+        if (!(0, web_1.hasTestBlock)({ testName, testSuites, filePath: fileName })) {
+            return {
+                isError: true,
+                result: `Test block not found for test name: "${testName}" in file: "${fileName}" with describe blocks: "${testSuites.join(", ")}"`,
+            };
+        }
         try {
             await (0, utils_1.replaceTodoWithCreateTest)({
                 testCaseName: testName,

package/dist/uploader/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/uploader/index.ts"],"names":[],"mappings":"~~AAWA~~,eAAO,MAAM,aAAa,gBAAgB,CAAC;AAC3C,eAAO,MAAM,aAAa,kCAAkC,CAAC;AAG7D,wBAAgB,iBAAiB,CAC/B,OAAO,EAAE,MAAM,EACf,QAAQ,EAAE,MAAM,EAChB,SAAS,EAAE,MAAM,UAKlB;AAED,wBAAgB,qBAAqB,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,UAEtE;AAED;;;;;;;;;GASG;AACH,wBAAsB,6BAA6B,CAAC,EAClD,eAAe,EACf,QAAQ,EACR,OAAO,GACR,EAAE;IACD,eAAe,EAAE,MAAM,CAAC;IACxB,QAAQ,EAAE,MAAM,CAAC;IACjB,OAAO,EAAE,MAAM,CAAC;CACjB,GAAG,OAAO,CAAC;IACV,SAAS,EAAE,MAAM,EAAE,CAAC;IACpB,UAAU,EAAE,MAAM,CAAC;IACnB,UAAU,EAAE,MAAM,EAAE,CAAC;CACtB,CAAC,CAgED;AAED,wBAAgB,mBAAmB,CAAC,eAAe,EAAE,MAAM,UAM1D;AAED,wBAAgB,2BAA2B,uBAQ1C"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/uploader/index.ts"],"names":[],"mappings":"AAYA,eAAO,MAAM,aAAa,gBAAgB,CAAC;AAC3C,eAAO,MAAM,aAAa,kCAAkC,CAAC;AAG7D,wBAAgB,iBAAiB,CAC/B,OAAO,EAAE,MAAM,EACf,QAAQ,EAAE,MAAM,EAChB,SAAS,EAAE,MAAM,UAKlB;AAED,wBAAgB,qBAAqB,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,UAEtE;AAED;;;;;;;;;GASG;AACH,wBAAsB,6BAA6B,CAAC,EAClD,eAAe,EACf,QAAQ,EACR,OAAO,GACR,EAAE;IACD,eAAe,EAAE,MAAM,CAAC;IACxB,QAAQ,EAAE,MAAM,CAAC;IACjB,OAAO,EAAE,MAAM,CAAC;CACjB,GAAG,OAAO,CAAC;IACV,SAAS,EAAE,MAAM,EAAE,CAAC;IACpB,UAAU,EAAE,MAAM,CAAC;IACnB,UAAU,EAAE,MAAM,EAAE,CAAC;CACtB,CAAC,CAgED;AAED,wBAAgB,mBAAmB,CAAC,eAAe,EAAE,MAAM,UAM1D;AAED,wBAAgB,2BAA2B,uBAQ1C"}

package/dist/uploader/index.js CHANGED Viewed

@@ -5,8 +5,8 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.checkIfResultsUploadAllowed = exports.getUploadPathForRun = exports.uploadTestResultsUsingPrjRepo = exports.getRelativeUploadPath = exports.getFullUploadPath = exports.UPLOAD_DOMAIN = exports.UPLOAD_BUCKET = void 0;
 const r2_uploader_1 = require("@empiricalrun/r2-uploader");
-const reporter_1 = require("@empiricalrun/reporter");
 const path_1 = __importDefault(require("path"));
+const utils_1 = require("./utils");
 // json summary of test results
 // originally we used to upload test results directory for this
 // but now we have our test results (per testcase artifacts) inside playwright-report/data
@@ -55,8 +55,8 @@ async function uploadTestResultsUsingPrjRepo({ projectRepoName, testName, repoDi
     const fileNames = Object.keys(files);
     console.log("Uploaded files", fileNames.map((f) => getFullUploadPath(repoDir, f, uploadDir)));
     const defaultLocation = path_1.default.join(repoDir, "playwright-report", "summary.json");
-    const results = (0, reporter_1.parseJsonReport)(defaultLocation);
-    const flatTestsList = (0, reporter_1.getFlattenedTestList)(results.suites);
+    const results = (0, utils_1.parseJsonReport)(defaultLocation);
+    const flatTestsList = (0, utils_1.getFlattenedTestList)(results.suites);
     const testAttachmentPaths = [];
     for (const test of flatTestsList) {
         if (test.title === testName) {

package/dist/uploader/utils.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+import type { JSONReportSpec, JSONReportSuite } from "@playwright/test/reporter";
+export declare function parseJsonReport<T>(srcFile: string): T;
+export type flattenedSpecT = JSONReportSpec & {
+    nesting: string[];
+    suitesString: string;
+};
+export declare const getFlattenedTestList: (suites: JSONReportSuite[]) => flattenedSpecT[];
+//# sourceMappingURL=utils.d.ts.map

package/dist/uploader/utils.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"utils.d.ts","sourceRoot":"","sources":["../../src/uploader/utils.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,cAAc,EACd,eAAe,EAChB,MAAM,2BAA2B,CAAC;AAGnC,wBAAgB,eAAe,CAAC,CAAC,EAAE,OAAO,EAAE,MAAM,GAAG,CAAC,CAErD;AAMD,MAAM,MAAM,cAAc,GAAG,cAAc,GAAG;IAC5C,OAAO,EAAE,MAAM,EAAE,CAAC;IAClB,YAAY,EAAE,MAAM,CAAC;CACtB,CAAC;AACF,eAAO,MAAM,oBAAoB,WACvB,eAAe,EAAE,KACxB,cAAc,EA4BhB,CAAC"}

package/dist/uploader/utils.js ADDED Viewed

@@ -0,0 +1,35 @@
+"use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.getFlattenedTestList = exports.parseJsonReport = void 0;
+const fs_1 = __importDefault(require("fs"));
+function parseJsonReport(srcFile) {
+    return JSON.parse(fs_1.default.readFileSync(srcFile, { encoding: "utf-8" }));
+}
+exports.parseJsonReport = parseJsonReport;
+const getFlattenedTestList = (suites) => {
+    let flattenedSpecs = [];
+    const traverseSuites = (suite, nesting = []) => {
+        nesting = [...nesting, suite.title];
+        flattenedSpecs.push(...suite.specs.map((spec) => {
+            const finalNesting = [...nesting, spec.title];
+            const suites = nesting.slice(1);
+            const suitesString = suites.length ? suites.join("~~") : "~~";
+            return {
+                ...spec,
+                nesting: finalNesting,
+                suitesString,
+            };
+        }));
+        // Traverse nested suites recursively
+        if (suite.suites && suite.suites.length > 0) {
+            suite.suites.forEach((suite) => traverseSuites(suite, nesting));
+        }
+    };
+    // Start the traversal from the top-level suites
+    suites.forEach((suite) => traverseSuites(suite));
+    return flattenedSpecs;
+};
+exports.getFlattenedTestList = getFlattenedTestList;

package/dist/utils/repo-tree.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"repo-tree.d.ts","sourceRoot":"","sources":["../../src/utils/repo-tree.ts"],"names":[],"mappings":"AAGA,eAAO,MAAM,eAAe,~~qBAQ3B~~,CAAC;AAEF,wBAAgB,iBAAiB,CAAC,OAAO,EAAE,MAAM,EAAE,OAAO,KAAK,UAsE9D"}
1	+ {"version":3,"file":"repo-tree.d.ts","sourceRoot":"","sources":["../../src/utils/repo-tree.ts"],"names":[],"mappings":"AAGA,eAAO,MAAM,eAAe,qBAU3B,CAAC;AAEF,wBAAgB,iBAAiB,CAAC,OAAO,EAAE,MAAM,EAAE,OAAO,KAAK,UAsE9D"}

package/dist/utils/repo-tree.js CHANGED Viewed

@@ -13,7 +13,9 @@ exports.DEFAULT_EXCLUDE = [
     /\.git/,
     ".DS_Store",
     "playwright-report",
+    "test-results",
     ".empiricalrun",
+    "auth",
 ];
 function generateAsciiTree(dirPath, options = {}) {
     const defaultOptions = {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@empiricalrun/test-gen",
-  "version": "0.51.5",
+  "version": "0.52.0",
   "publishConfig": {
     "registry": "https://registry.npmjs.org/",
     "access": "public"
@@ -48,6 +48,7 @@
     "@actions/core": "^1.10.1",
     "@babel/parser": "^7.26.3",
     "@types/sanitize-html": "^2.11.0",
+    "async-retry": "^1.3.3",
     "commander": "^12.1.0",
     "detect-port": "^1.6.1",
     "dotenv": "^16.4.5",
@@ -74,13 +75,13 @@
     "tsx": "^4.16.2",
     "typescript": "^5.3.3",
     "zod": "^3.23.8",
-    "@empiricalrun/llm": "^0.11.4",
+    "@empiricalrun/llm": "^0.12.0",
     "@empiricalrun/r2-uploader": "^0.3.8",
-    "@empiricalrun/reporter": "^0.23.2",
     "@empiricalrun/test-run": "^0.7.6"
   },
   "devDependencies": {
     "@playwright/test": "1.47.1",
+    "@types/async-retry": "^1.4.8",
     "@types/detect-port": "^1.3.5",
     "@types/express": "^4.17.21",
     "@types/fs-extra": "^11.0.4",

package/dist/agent/chat.d.ts DELETED Viewed

@@ -1,5 +0,0 @@
-export declare function chatAgent({ chatModel, useDiskForChatState, }: {
-    chatModel?: "claude-3-7-sonnet-20250219" | "claude-3-5-sonnet-20241022";
-    useDiskForChatState?: boolean;
-}): Promise<string>;
-//# sourceMappingURL=chat.d.ts.map

package/dist/agent/chat.d.ts.map DELETED Viewed

	@@ -1 +0,0 @@
1	- {"version":3,"file":"chat.d.ts","sourceRoot":"","sources":["../../src/agent/chat.ts"],"names":[],"mappings":"AA+FA,wBAAsB,SAAS,CAAC,EAC9B,SAAwC,EACxC,mBAAmB,GACpB,EAAE;IACD,SAAS,CAAC,EAAE,4BAA4B,GAAG,4BAA4B,CAAC;IACxE,mBAAmB,CAAC,EAAE,OAAO,CAAC;CAC/B,mBAkHA"}

package/dist/agent/chat.js DELETED Viewed

@@ -1,188 +0,0 @@
-"use strict";
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
-};
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.chatAgent = void 0;
-const chat_1 = require("@empiricalrun/llm/chat");
-const path_1 = __importDefault(require("path"));
-const picocolors_1 = require("picocolors");
-const web_1 = require("../bin/utils/platform/web");
-const human_in_the_loop_1 = require("../human-in-the-loop");
-const diagnosis_fetcher_1 = require("../tools/diagnosis-fetcher");
-const grep_1 = require("../tools/grep");
-const test_gen_browser_1 = require("../tools/test-gen-browser");
-const test_run_1 = require("../tools/test-run");
-const test_run_fetcher_1 = require("../tools/test-run-fetcher");
-const zod_schema_1 = require("../tools/zod-schema");
-const repo_tree_1 = require("../utils/repo-tree");
-const systemPrompt = `
-You are a helpful assistant that can answer questions and help with tasks.
-You are given a set of tools to use to fulfill the user's request. Read their descriptions to
-understand what each tool does.
-# Tools
-For example, if the user asks you to run a test, you could use the runTest tool.
-Once the test is run, you will receive the results in the form of a JSON object.
-Summarize the results in a few sentences.
-If the user provides a diagnosis URL, you can use the fetchDiagnosisDetails tool
-to get more information about the test case and its results.
-If the user provides a test run URL, you can use the fetchTestRunDetails tool
-to get detailed information about a specific test run.
-Or if the user asks you to modify a test, you could use the generateTestWithBrowserAgent tool. If you suspect
-that a UI selector needs to be updated, using the browser agent is a good idea.
-Before using generateTestWithBrowserAgent, you need to prepare the test code for the browser agent.
-You can do this by using the str_replace_editor tool to add a TODO comment to the test code. This
-comment should explain to the browser agent what to do.
-For example, if the expected modification is to click on a login button, you could add the following comment.
-// TODO(agent): Click on the login button
-The position of the comment is important: the browser agent will look for this comment and replace it with
-the actual code to click on the login button. If you are fixing a failing test, your comment should be
-around the failing line of code, so that it can be replaced/modified.
-# Repo context
-You are running as a CLI tool inside the directory of the repo where this test file is located. Here is
-the repo directory structure:
-${(0, repo_tree_1.generateAsciiTree)(process.cwd())}
-While specifying paths to files, use relative paths from the current working directory. For example:
-- Correct path: "tests/lesson.spec.ts"
-- Incorrect path: "/repo/tests/lesson.spec.ts" or "${path_1.default.basename(process.cwd())}/tests/lesson.spec.ts"
-# Rules for fixing Playwright tests
-You must follow these rules while adding new tests or modifying existing tests. There can be exceptions to these rules, but
-ONLY when explicitly asked for by the user.
-1. Do not add any conditional logic or try catch blocks in a test. A good test deterministically tests a user scenario
-2. Trust Playwright's ability to auto-wait while taking actions on elements. For example, do not add checks on locator.isVisible() before clicking on it: Playwright already does this
-3. Do not add waitForTimeout or waitForLoadState in a test. Playwright will automatically wait for the page to load.
-4. You can't delete some steps from the test to make it pass. The test needs to accomplish its objective (which is to validate a particular user scenario)
-# Proactiveness
-You are allowed to be proactive, but only when the user asks you to do something. You should strive to
-strike a balance between:
-1. Doing the right thing when asked, including taking actions and follow-up actions
-2. Not surprising the user with actions you take without asking. It is okay to ask the user for confirmation before taking actions.
-`;
-const tools = [
-    test_run_1.runTestTool,
-    test_gen_browser_1.generateTestWithBrowserAgent,
-    diagnosis_fetcher_1.diagnosisTool,
-    grep_1.grepTool,
-    test_run_fetcher_1.testRunTool,
-];
-const toolExecutors = {
-    ...Object.fromEntries(tools.map((tool) => [tool.schema.name, tool.execute])),
-    str_replace_editor: (input) => (0, chat_1.strReplaceEditorTool)(input, web_1.validateTypescript),
-};
-async function chatAgent({ chatModel = "claude-3-7-sonnet-20250219", useDiskForChatState, }) {
-    const ora = (await import("ora")).default;
-    let userPrompt = undefined;
-    let chatState = useDiskForChatState ? chat_1.ChatState.load() : new chat_1.ChatState(false);
-    const handleSigInt = () => {
-        console.log(`\n${(0, picocolors_1.gray)("Usage summary -> " + chatState.getUsageSummary())}`);
-        process.exit(0);
-    };
-    process.once("SIGINT", handleSigInt);
-    process.once("SIGTERM", handleSigInt);
-    if (chatState.askUserForInput) {
-        // Show last message to the user for context when we loaded from disk
-        const messages = chatState.messages;
-        const lastMessage = messages[messages.length - 1];
-        if (lastMessage && Array.isArray(lastMessage.content)) {
-            const textContent = lastMessage.content.find((b) => b.type === "text");
-            if (textContent) {
-                const role = lastMessage.role.charAt(0).toUpperCase() + lastMessage.role.slice(1);
-                console.log(`${role}: ${textContent.text}`);
-            }
-        }
-    }
-    while (!userPrompt?.toLowerCase().includes("stop")) {
-        chatState.saveToDisk();
-        if (chatState.askUserForInput) {
-            try {
-                userPrompt = await human_in_the_loop_1.humanLoop.getFeedback({
-                    message: "User:",
-                });
-            }
-            catch (e) {
-                // https://github.com/SBoudrias/Inquirer.js/issues/1502#issuecomment-2275991680
-                if (e instanceof Error && e.name === "ExitPromptError") {
-                    console.log(`\n${(0, picocolors_1.gray)("Usage summary -> " + chatState.getUsageSummary())}`);
-                    process.exit(0);
-                }
-                throw e;
-            }
-            chatState.pushMessage({
-                role: "user",
-                content: [
-                    {
-                        type: "text",
-                        text: userPrompt,
-                    },
-                ],
-            });
-            continue;
-        }
-        const toolUse = chatState.getPendingToolCall();
-        if (toolUse) {
-            const spinner = ora(`Executing tool ${toolUse.name} with args: ${JSON.stringify(toolUse.input)}`).start();
-            const toolExecutor = toolExecutors[toolUse.name];
-            if (!toolExecutor) {
-                throw new Error(`Tool ${toolUse.name} not found`);
-            }
-            const toolResult = await toolExecutor(toolUse.input);
-            if (toolResult.isError) {
-                spinner.fail(`Tool ${toolUse.name} failed with error: ${toolResult.result}`);
-            }
-            else {
-                spinner.succeed(`Tool ${toolUse.name} completed`);
-            }
-            chatState.pushMessage({
-                role: "user",
-                content: [
-                    {
-                        type: "tool_result",
-                        tool_use_id: toolUse.id,
-                        content: toolResult.result,
-                        is_error: toolResult.isError,
-                    },
-                ],
-            });
-            continue;
-        }
-        const spinner = ora("Claude is working...").start();
-        const response = await (0, chat_1.createClaudeMessage)({
-            systemPrompt,
-            messages: chatState.getMessagesForCreateCompletion(),
-            tools: tools.map((tool) => (0, chat_1.convertOpenAISchemaToAnthropic)((0, zod_schema_1.zodToOpenAITool)(tool.schema))),
-            model: chatModel,
-            withStrReplaceEditor: true,
-        });
-        spinner.stop();
-        if (!response) {
-            throw new Error("No response from LLM");
-        }
-        chatState.pushMessage(response);
-        const textBlock = response.content.find((b) => b.type === "text");
-        if (textBlock) {
-            console.log("Assistant:", textBlock.text);
-        }
-    }
-    const usageSummary = chatState.getUsageSummary();
-    console.log(`\n${(0, picocolors_1.gray)("Usage summary -> " + chatState.getUsageSummary())}`);
-    return usageSummary;
-}
-exports.chatAgent = chatAgent;