@midscene/core 0.21.4-beta-20250711063424.0 → 0.21.4-beta-20250714025212.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32)
  1. package/dist/es/ai-model.d.ts +36 -24
  2. package/dist/es/ai-model.js +5 -1
  3. package/dist/es/{chunk-QT5OZCDN.js → chunk-H3KP5MGB.js} +407 -219
  4. package/dist/es/chunk-H3KP5MGB.js.map +1 -0
  5. package/dist/es/{chunk-2CMOAEAS.js → chunk-QKX52XS3.js} +3 -3
  6. package/dist/es/index.d.ts +4 -4
  7. package/dist/es/index.js +2 -2
  8. package/dist/es/{llm-planning-fe687364.d.ts → llm-planning-b342ff86.d.ts} +1 -1
  9. package/dist/es/{types-b0b4c68e.d.ts → types-05553e39.d.ts} +32 -1
  10. package/dist/es/utils.d.ts +1 -1
  11. package/dist/es/utils.js +1 -1
  12. package/dist/lib/ai-model.d.ts +36 -24
  13. package/dist/lib/ai-model.js +6 -2
  14. package/dist/lib/{chunk-QT5OZCDN.js → chunk-H3KP5MGB.js} +421 -233
  15. package/dist/lib/chunk-H3KP5MGB.js.map +1 -0
  16. package/dist/lib/{chunk-2CMOAEAS.js → chunk-QKX52XS3.js} +3 -3
  17. package/dist/lib/index.d.ts +4 -4
  18. package/dist/lib/index.js +12 -12
  19. package/dist/lib/{llm-planning-fe687364.d.ts → llm-planning-b342ff86.d.ts} +1 -1
  20. package/dist/lib/{types-b0b4c68e.d.ts → types-05553e39.d.ts} +32 -1
  21. package/dist/lib/utils.d.ts +1 -1
  22. package/dist/lib/utils.js +2 -2
  23. package/dist/types/ai-model.d.ts +36 -24
  24. package/dist/types/index.d.ts +4 -4
  25. package/dist/types/{llm-planning-fe687364.d.ts → llm-planning-b342ff86.d.ts} +1 -1
  26. package/dist/types/{types-b0b4c68e.d.ts → types-05553e39.d.ts} +32 -1
  27. package/dist/types/utils.d.ts +1 -1
  28. package/package.json +3 -3
  29. package/dist/es/chunk-QT5OZCDN.js.map +0 -1
  30. package/dist/lib/chunk-QT5OZCDN.js.map +0 -1
  31. /package/dist/es/{chunk-2CMOAEAS.js.map → chunk-QKX52XS3.js.map} +0 -0
  32. /package/dist/lib/{chunk-2CMOAEAS.js.map → chunk-QKX52XS3.js.map} +0 -0
@@ -1135,13 +1135,24 @@ pageDescription:
 
  // src/ai-model/service-caller/index.ts
  function checkAIConfig() {
- if (getAIConfig(OPENAI_API_KEY))
+ const openaiKey = getAIConfig(OPENAI_API_KEY);
+ const azureConfig = getAIConfig(MIDSCENE_USE_AZURE_OPENAI);
+ const anthropicKey = getAIConfig(ANTHROPIC_API_KEY);
+ const initConfigJson = getAIConfig(MIDSCENE_OPENAI_INIT_CONFIG_JSON);
+ console.log("AI Config Check:", {
+ hasOpenAI: !!openaiKey,
+ hasAzure: !!azureConfig,
+ hasAnthropic: !!anthropicKey,
+ hasInitConfig: !!initConfigJson,
+ openaiKeyPrefix: openaiKey ? `${openaiKey.substring(0, 10)}...` : "none"
+ });
+ if (openaiKey)
  return true;
- if (getAIConfig(MIDSCENE_USE_AZURE_OPENAI))
+ if (azureConfig)
  return true;
- if (getAIConfig(ANTHROPIC_API_KEY))
+ if (anthropicKey)
  return true;
- return Boolean(getAIConfig(MIDSCENE_OPENAI_INIT_CONFIG_JSON));
+ return Boolean(initConfigJson);
  }
  var debugConfigInitialized = false;
  function initDebugConfig() {
@@ -1290,7 +1301,7 @@ Please check your config.`
  }
  throw new Error("Openai SDK or Anthropic SDK is not initialized");
  }
- async function call(messages, AIActionTypeValue, responseFormat) {
+ async function call(messages, AIActionTypeValue, responseFormat, options) {
  const { completion, style } = await createChatClient({
  AIActionTypeValue
  });
@@ -1300,91 +1311,217 @@ async function call(messages, AIActionTypeValue, responseFormat) {
  const debugProfileDetail = getDebug2("ai:profile:detail");
  const startTime = Date.now();
  const model = getModelName();
+ const isStreaming = options?.stream && options?.onChunk;
  let content;
+ let accumulated = "";
  let usage;
  let timeCost;
  const commonConfig = {
  temperature: vlLocateMode3() === "vlm-ui-tars" ? 0 : 0.1,
- stream: false,
+ stream: !!isStreaming,
  max_tokens: typeof maxTokens === "number" ? maxTokens : Number.parseInt(maxTokens || "2048", 10),
  ...vlLocateMode3() === "qwen-vl" ? {
  vl_high_resolution_images: true
  } : {}
  };
- if (style === "openai") {
- debugCall(`sending request to ${model}`);
- let result;
- try {
- const startTime2 = Date.now();
- result = await completion.create({
- model,
- messages,
- response_format: responseFormat,
- ...commonConfig
- });
- timeCost = Date.now() - startTime2;
- } catch (e) {
- const newError = new Error(
- `failed to call AI model service: ${e.message}. Trouble shooting: https://midscenejs.com/model-provider.html`,
- {
- cause: e
- }
+ try {
+ if (style === "openai") {
+ debugCall(
+ `sending ${isStreaming ? "streaming " : ""}request to ${model}`
  );
- throw newError;
- }
- debugProfileStats(
- `model, ${model}, mode, ${vlLocateMode3() || "default"}, ui-tars-version, ${uiTarsModelVersion()}, prompt-tokens, ${result.usage?.prompt_tokens || ""}, completion-tokens, ${result.usage?.completion_tokens || ""}, total-tokens, ${result.usage?.total_tokens || ""}, cost-ms, ${Date.now() - startTime}, requestId, ${result._request_id || ""}`
- );
- debugProfileDetail(`model usage detail: ${JSON.stringify(result.usage)}`);
- assert3(
- result.choices,
- `invalid response from LLM service: ${JSON.stringify(result)}`
- );
- content = result.choices[0].message.content;
- debugCall(`response: ${content}`);
- assert3(content, "empty content");
- usage = result.usage;
- } else if (style === "anthropic") {
- const convertImageContent = (content2) => {
- if (content2.type === "image_url") {
- const imgBase64 = content2.image_url.url;
- assert3(imgBase64, "image_url is required");
- return {
- source: {
- type: "base64",
- media_type: imgBase64.includes("data:image/png;base64,") ? "image/png" : "image/jpeg",
- data: imgBase64.split(",")[1]
+ if (isStreaming) {
+ const stream = await completion.create(
+ {
+ model,
+ messages,
+ response_format: responseFormat,
+ ...commonConfig
  },
- type: "image"
- };
+ {
+ stream: true
+ }
+ );
+ for await (const chunk of stream) {
+ const content2 = chunk.choices?.[0]?.delta?.content || "";
+ const reasoning_content = chunk.choices?.[0]?.delta?.reasoning_content || "";
+ if (chunk.usage) {
+ usage = chunk.usage;
+ }
+ if (content2 || reasoning_content) {
+ accumulated += content2;
+ const chunkData = {
+ content: content2,
+ reasoning_content,
+ accumulated,
+ isComplete: false,
+ usage: void 0
+ };
+ options.onChunk(chunkData);
+ }
+ if (chunk.choices?.[0]?.finish_reason) {
+ timeCost = Date.now() - startTime;
+ if (!usage) {
+ const estimatedTokens = Math.max(
+ 1,
+ Math.floor(accumulated.length / 4)
+ );
+ usage = {
+ prompt_tokens: estimatedTokens,
+ completion_tokens: estimatedTokens,
+ total_tokens: estimatedTokens * 2
+ };
+ }
+ const finalChunk = {
+ content: "",
+ accumulated,
+ reasoning_content: "",
+ isComplete: true,
+ usage: {
+ prompt_tokens: usage.prompt_tokens ?? 0,
+ completion_tokens: usage.completion_tokens ?? 0,
+ total_tokens: usage.total_tokens ?? 0,
+ time_cost: timeCost ?? 0
+ }
+ };
+ options.onChunk(finalChunk);
+ break;
+ }
+ }
+ content = accumulated;
+ debugProfileStats(
+ `streaming model, ${model}, mode, ${vlLocateMode3() || "default"}, cost-ms, ${timeCost}`
+ );
+ } else {
+ const result = await completion.create({
+ model,
+ messages,
+ response_format: responseFormat,
+ ...commonConfig
+ });
+ timeCost = Date.now() - startTime;
+ debugProfileStats(
+ `model, ${model}, mode, ${vlLocateMode3() || "default"}, ui-tars-version, ${uiTarsModelVersion()}, prompt-tokens, ${result.usage?.prompt_tokens || ""}, completion-tokens, ${result.usage?.completion_tokens || ""}, total-tokens, ${result.usage?.total_tokens || ""}, cost-ms, ${timeCost}, requestId, ${result._request_id || ""}`
+ );
+ debugProfileDetail(
+ `model usage detail: ${JSON.stringify(result.usage)}`
+ );
+ assert3(
+ result.choices,
+ `invalid response from LLM service: ${JSON.stringify(result)}`
+ );
+ content = result.choices[0].message.content;
+ usage = result.usage;
  }
- return content2;
+ debugCall(`response: ${content}`);
+ assert3(content, "empty content");
+ } else if (style === "anthropic") {
+ const convertImageContent = (content2) => {
+ if (content2.type === "image_url") {
+ const imgBase64 = content2.image_url.url;
+ assert3(imgBase64, "image_url is required");
+ return {
+ source: {
+ type: "base64",
+ media_type: imgBase64.includes("data:image/png;base64,") ? "image/png" : "image/jpeg",
+ data: imgBase64.split(",")[1]
+ },
+ type: "image"
+ };
+ }
+ return content2;
+ };
+ if (isStreaming) {
+ const stream = await completion.create({
+ model,
+ system: "You are a versatile professional in software UI automation",
+ messages: messages.map((m) => ({
+ role: "user",
+ content: Array.isArray(m.content) ? m.content.map(convertImageContent) : m.content
+ })),
+ response_format: responseFormat,
+ ...commonConfig
+ });
+ for await (const chunk of stream) {
+ const content2 = chunk.delta?.text || "";
+ if (content2) {
+ accumulated += content2;
+ const chunkData = {
+ content: content2,
+ accumulated,
+ reasoning_content: "",
+ isComplete: false,
+ usage: void 0
+ };
+ options.onChunk(chunkData);
+ }
+ if (chunk.type === "message_stop") {
+ timeCost = Date.now() - startTime;
+ const anthropicUsage = chunk.usage;
+ const finalChunk = {
+ content: "",
+ accumulated,
+ reasoning_content: "",
+ isComplete: true,
+ usage: anthropicUsage ? {
+ prompt_tokens: anthropicUsage.input_tokens ?? 0,
+ completion_tokens: anthropicUsage.output_tokens ?? 0,
+ total_tokens: (anthropicUsage.input_tokens ?? 0) + (anthropicUsage.output_tokens ?? 0),
+ time_cost: timeCost ?? 0
+ } : void 0
+ };
+ options.onChunk(finalChunk);
+ break;
+ }
+ }
+ content = accumulated;
+ } else {
+ const result = await completion.create({
+ model,
+ system: "You are a versatile professional in software UI automation",
+ messages: messages.map((m) => ({
+ role: "user",
+ content: Array.isArray(m.content) ? m.content.map(convertImageContent) : m.content
+ })),
+ response_format: responseFormat,
+ ...commonConfig
+ });
+ timeCost = Date.now() - startTime;
+ content = result.content[0].text;
+ usage = result.usage;
+ }
+ assert3(content, "empty content");
+ }
+ if (isStreaming && !usage) {
+ const estimatedTokens = Math.max(
+ 1,
+ Math.floor((content || "").length / 4)
+ );
+ usage = {
+ prompt_tokens: estimatedTokens,
+ completion_tokens: estimatedTokens,
+ total_tokens: estimatedTokens * 2
+ };
+ }
+ return {
+ content: content || "",
+ usage: usage ? {
+ prompt_tokens: usage.prompt_tokens ?? 0,
+ completion_tokens: usage.completion_tokens ?? 0,
+ total_tokens: usage.total_tokens ?? 0,
+ time_cost: timeCost ?? 0
+ } : void 0,
+ isStreamed: !!isStreaming
  };
- const startTime2 = Date.now();
- const result = await completion.create({
- model,
- system: "You are a versatile professional in software UI automation",
- messages: messages.map((m) => ({
- role: "user",
- content: Array.isArray(m.content) ? m.content.map(convertImageContent) : m.content
- })),
- response_format: responseFormat,
- ...commonConfig
- });
- timeCost = Date.now() - startTime2;
- content = result.content[0].text;
- assert3(content, "empty content");
- usage = result.usage;
+ } catch (e) {
+ console.error(" call AI error", e);
+ const newError = new Error(
+ `failed to call ${isStreaming ? "streaming " : ""}AI model service: ${e.message}. Trouble shooting: https://midscenejs.com/model-provider.html`,
+ {
+ cause: e
+ }
+ );
+ throw newError;
  }
- return {
- content: content || "",
- usage: {
- prompt_tokens: usage?.prompt_tokens ?? 0,
- completion_tokens: usage?.completion_tokens ?? 0,
- total_tokens: usage?.total_tokens ?? 0,
- time_cost: timeCost ?? 0
- }
- };
  }
  async function callToGetJSONObject(messages, AIActionTypeValue) {
  let responseFormat;
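
The hunk above is the core of the release: call() gains an optional fourth options argument, and when both options.stream and options.onChunk are set it forwards deltas as they arrive, then emits one final chunk with isComplete: true carrying usage totals (estimated at roughly one token per four characters when the provider reports none). A minimal consumer sketch in TypeScript; the StreamChunk interface below is a hypothetical name that mirrors the fields visible in the diff, not a type exported under that name:

    // Hypothetical shape, transcribed from the chunk objects built in the diff above.
    interface StreamChunk {
      content: string;           // delta text for this chunk ("" on the final chunk)
      reasoning_content: string; // reasoning delta, where the provider supplies one
      accumulated: string;       // everything received so far
      isComplete: boolean;       // true exactly once, on the final chunk
      usage?: {
        prompt_tokens: number;
        completion_tokens: number;
        total_tokens: number;
        time_cost: number;
      };
    }

    // Passed to call() as the new fourth argument: { stream: true, onChunk }.
    const onChunk = (chunk: StreamChunk): void => {
      if (chunk.isComplete) {
        console.log(`\ndone (${chunk.usage?.total_tokens ?? 0} tokens)`);
      } else {
        process.stdout.write(chunk.content);
      }
    };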
@@ -1464,6 +1601,9 @@ function safeParseJson(input) {
 
  // src/ai-model/prompt/playwright-generator.ts
  import { PLAYWRIGHT_EXAMPLE_CODE } from "@midscene/shared/constants";
+
+ // src/ai-model/prompt/yaml-generator.ts
+ import { YAML_EXAMPLE_CODE } from "@midscene/shared/constants";
  var getScreenshotsForLLM = (events, maxScreenshots = 1) => {
  const eventsWithScreenshots = events.filter(
  (event) => event.screenshotBefore || event.screenshotAfter || event.screenshotWithBox
@@ -1529,7 +1669,6 @@ var prepareEventSummary = (events, options = {}) => {
  const filteredEvents = filterEventsByType(events);
  const eventCounts = createEventCounts(filteredEvents, events.length);
  const startUrl = filteredEvents.navigationEvents.length > 0 ? filteredEvents.navigationEvents[0].url || "" : "";
- const pageTitles = filteredEvents.navigationEvents.map((event) => event.title).filter((title) => Boolean(title)).slice(0, 5);
  const clickDescriptions = filteredEvents.clickEvents.map((event) => event.elementDescription).filter((desc) => Boolean(desc)).slice(0, 10);
  const inputDescriptions = extractInputDescriptions(
  filteredEvents.inputEvents
@@ -1540,7 +1679,6 @@ var prepareEventSummary = (events, options = {}) => {
  testName: options.testName || "Automated test from recorded events",
  startUrl,
  eventCounts,
- pageTitles,
  urls,
  clickDescriptions,
  inputDescriptions,
@@ -1575,6 +1713,141 @@ var validateEvents = (events) => {
  throw new Error("No events provided for test generation");
  }
  };
+ var generateYamlTest = async (events, options = {}) => {
+ try {
+ validateEvents(events);
+ const summary = prepareEventSummary(events, {
+ testName: options.testName,
+ maxScreenshots: options.maxScreenshots || 3
+ });
+ const yamlSummary = {
+ ...summary,
+ includeTimestamps: options.includeTimestamps || false
+ };
+ const screenshots = getScreenshotsForLLM(
+ events,
+ options.maxScreenshots || 3
+ );
+ const prompt = [
+ {
+ role: "system",
+ content: `You are an expert in Midscene.js YAML test generation. Generate clean, accurate YAML following these rules: ${YAML_EXAMPLE_CODE}`
+ },
+ {
+ role: "user",
+ content: `Generate YAML test for Midscene.js automation from recorded browser events.
+
+ Event Summary:
+ ${JSON.stringify(yamlSummary, null, 2)}
+
+ Convert events:
+ - navigation → target.url
+ - click → aiTap with element description
+ - input → aiInput with value and locate
+ - scroll → aiScroll with appropriate direction
+ - Add aiAssert for important state changes
+
+ Respond with YAML only, no explanations.`
+ }
+ ];
+ if (screenshots.length > 0) {
+ prompt.push({
+ role: "user",
+ content: "Here are screenshots from the recording session to help you understand the context:"
+ });
+ prompt.push({
+ role: "user",
+ content: screenshots.map((screenshot) => ({
+ type: "image_url",
+ image_url: {
+ url: screenshot
+ }
+ }))
+ });
+ }
+ const response = await call(prompt, 2 /* EXTRACT_DATA */);
+ if (response?.content && typeof response.content === "string") {
+ return response.content;
+ }
+ throw new Error("Failed to generate YAML test configuration");
+ } catch (error) {
+ throw new Error(`Failed to generate YAML test: ${error}`);
+ }
+ };
+ var generateYamlTestStream = async (events, options = {}) => {
+ try {
+ validateEvents(events);
+ const summary = prepareEventSummary(events, {
+ testName: options.testName,
+ maxScreenshots: options.maxScreenshots || 3
+ });
+ const yamlSummary = {
+ ...summary,
+ includeTimestamps: options.includeTimestamps || false
+ };
+ const screenshots = getScreenshotsForLLM(
+ events,
+ options.maxScreenshots || 3
+ );
+ const prompt = [
+ {
+ role: "system",
+ content: `You are an expert in Midscene.js YAML test generation. Generate clean, accurate YAML following these rules: ${YAML_EXAMPLE_CODE}`
+ },
+ {
+ role: "user",
+ content: `Generate YAML test for Midscene.js automation from recorded browser events.
+
+ Event Summary:
+ ${JSON.stringify(yamlSummary, null, 2)}
+
+ Convert events:
+ - navigation → target.url
+ - click → aiTap with element description
+ - input → aiInput with value and locate
+ - scroll → aiScroll with appropriate direction
+ - Add aiAssert for important state changes
+
+ Respond with YAML only, no explanations.`
+ }
+ ];
+ if (screenshots.length > 0) {
+ prompt.push({
+ role: "user",
+ content: "Here are screenshots from the recording session to help you understand the context:"
+ });
+ prompt.push({
+ role: "user",
+ content: screenshots.map((screenshot) => ({
+ type: "image_url",
+ image_url: {
+ url: screenshot
+ }
+ }))
+ });
+ }
+ if (options.stream && options.onChunk) {
+ return await call(prompt, 2 /* EXTRACT_DATA */, void 0, {
+ stream: true,
+ onChunk: options.onChunk
+ });
+ } else {
+ const response = await call(prompt, 2 /* EXTRACT_DATA */);
+ if (response?.content && typeof response.content === "string") {
+ return {
+ content: response.content,
+ usage: response.usage,
+ isStreamed: false
+ };
+ }
+ throw new Error("Failed to generate YAML test configuration");
+ }
+ } catch (error) {
+ throw new Error(`Failed to generate YAML test: ${error}`);
+ }
+ };
+
+ // src/ai-model/prompt/playwright-generator.ts
  var generatePlaywrightTest = async (events, options = {}) => {
  validateEvents(events);
  const summary = prepareEventSummary(events, {
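
Both new generators share the same calling convention. A sketch of how generateYamlTestStream might be driven, inferred from the signature in the hunk above; the import path and the shape of the recorded events are assumptions, and in streaming mode the resolved value still carries the final content and usage:

    // Import path assumed; only the chunk-level export is visible in this diff.
    import { generateYamlTestStream } from "@midscene/core/ai-model";

    async function yamlFromRecording(events: unknown[]): Promise<string> {
      const result = await generateYamlTestStream(events, {
        testName: "recorded session",
        maxScreenshots: 3,
        stream: true,
        // Print the YAML as it streams in.
        onChunk: (chunk) => process.stdout.write(chunk.content),
      });
      return result.content; // full accumulated YAML once the stream completes
    }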
@@ -1628,156 +1901,69 @@ ${PLAYWRIGHT_EXAMPLE_CODE}`;
  }
  throw new Error("Failed to generate Playwright test code");
  };
-
- // src/ai-model/prompt/yaml-generator.ts
- import { YAML_EXAMPLE_CODE } from "@midscene/shared/constants";
- var getScreenshotsForLLM2 = (events, maxScreenshots = 1) => {
- const eventsWithScreenshots = events.filter(
- (event) => event.screenshotBefore || event.screenshotAfter || event.screenshotWithBox
- );
- const sortedEvents = [...eventsWithScreenshots].sort((a, b) => {
- if (a.type === "navigation" && b.type !== "navigation")
- return -1;
- if (a.type !== "navigation" && b.type === "navigation")
- return 1;
- if (a.type === "click" && b.type !== "click")
- return -1;
- if (a.type !== "click" && b.type === "click")
- return 1;
- return 0;
+ var generatePlaywrightTestStream = async (events, options = {}) => {
+ validateEvents(events);
+ const summary = prepareEventSummary(events, {
+ testName: options.testName,
+ maxScreenshots: options.maxScreenshots || 3
  });
- const screenshots = [];
- for (const event of sortedEvents) {
- const screenshot = event.screenshotWithBox || event.screenshotAfter || event.screenshotBefore;
- if (screenshot && !screenshots.includes(screenshot)) {
- screenshots.push(screenshot);
- if (screenshots.length >= maxScreenshots)
- break;
- }
- }
- return screenshots;
- };
- var filterEventsByType2 = (events) => {
- return {
- navigationEvents: events.filter((event) => event.type === "navigation"),
- clickEvents: events.filter((event) => event.type === "click"),
- inputEvents: events.filter((event) => event.type === "input"),
- scrollEvents: events.filter((event) => event.type === "scroll")
- };
- };
- var createEventCounts2 = (filteredEvents, totalEvents) => {
- return {
- navigation: filteredEvents.navigationEvents.length,
- click: filteredEvents.clickEvents.length,
- input: filteredEvents.inputEvents.length,
- scroll: filteredEvents.scrollEvents.length,
- total: totalEvents
- };
- };
- var extractInputDescriptions2 = (inputEvents) => {
- return inputEvents.map((event) => ({
- description: event.elementDescription || "",
- value: event.value || ""
- })).filter((item) => item.description && item.value);
- };
- var processEventsForLLM2 = (events) => {
- return events.map((event) => ({
- type: event.type,
- timestamp: event.timestamp,
- url: event.url,
- title: event.title,
- elementDescription: event.elementDescription,
- value: event.value,
- pageInfo: event.pageInfo,
- elementRect: event.elementRect
- }));
- };
- var prepareEventSummary2 = (events, options = {}) => {
- const filteredEvents = filterEventsByType2(events);
- const eventCounts = createEventCounts2(filteredEvents, events.length);
- const startUrl = filteredEvents.navigationEvents.length > 0 ? filteredEvents.navigationEvents[0].url || "" : "";
- const pageTitles = filteredEvents.navigationEvents.map((event) => event.title).filter((title) => Boolean(title)).slice(0, 5);
- const clickDescriptions = filteredEvents.clickEvents.map((event) => event.elementDescription).filter((desc) => Boolean(desc)).slice(0, 10);
- const inputDescriptions = extractInputDescriptions2(
- filteredEvents.inputEvents
- ).slice(0, 10);
- const urls = filteredEvents.navigationEvents.map((e) => e.url).filter((url) => Boolean(url)).slice(0, 5);
- const processedEvents = processEventsForLLM2(events);
- return {
- testName: options.testName || "Automated test from recorded events",
- startUrl,
- eventCounts,
- pageTitles,
- urls,
- clickDescriptions,
- inputDescriptions,
- events: processedEvents
+ const playwrightSummary = {
+ ...summary,
+ waitForNetworkIdle: options.waitForNetworkIdle !== false,
+ waitForNetworkIdleTimeout: options.waitForNetworkIdleTimeout || 2e3,
+ viewportSize: options.viewportSize || { width: 1280, height: 800 }
  };
- };
- var validateEvents2 = (events) => {
- if (!events.length) {
- throw new Error("No events provided for test generation");
- }
- };
- var generateYamlTest = async (events, options = {}) => {
- try {
- validateEvents2(events);
- const summary = prepareEventSummary2(events, {
- testName: options.testName,
- maxScreenshots: options.maxScreenshots || 3
- });
- const yamlSummary = {
- ...summary,
- includeTimestamps: options.includeTimestamps || false
- };
- const screenshots = getScreenshotsForLLM2(
- events,
- options.maxScreenshots || 3
- );
- const prompt = [
- {
- role: "system",
- content: `You are an expert in Midscene.js YAML test generation. Generate clean, accurate YAML following these rules: ${YAML_EXAMPLE_CODE}`
- },
- {
- role: "user",
- content: `Generate YAML test for Midscene.js automation from recorded browser events.
+ const screenshots = getScreenshotsForLLM(events, options.maxScreenshots || 3);
+ const promptText = `Generate a Playwright test using @midscene/web/playwright that reproduces this recorded browser session. The test should be based on the following events and follow the structure of the example provided. Make the test descriptive with appropriate assertions and validations.
 
  Event Summary:
- ${JSON.stringify(yamlSummary, null, 2)}
+ ${JSON.stringify(playwrightSummary, null, 2)}
 
- Convert events:
- - navigation → target.url
- - click → aiTap with element description
- - input → aiInput with value and locate
- - scroll → aiScroll with appropriate direction
- - Add aiAssert for important state changes
+ Generated code should:
+ 1. Import required dependencies
+ 2. Set up the test with proper configuration
+ 3. Include a beforeEach hook to navigate to the starting URL
+ 4. Implement a test that uses Midscene AI methods (aiTap, aiInput, aiAssert, etc.)
+ 5. Include appropriate assertions and validations
+ 6. Follow best practices for Playwright tests
+ 7. Be ready to execute without further modification
+ 8. can't wrap this test code in markdown code block
 
- Respond with YAML only, no explanations.`
- }
- ];
- if (screenshots.length > 0) {
- prompt.push({
- role: "user",
- content: "Here are screenshots from the recording session to help you understand the context:"
- });
- prompt.push({
- role: "user",
- content: screenshots.map((screenshot) => ({
- type: "image_url",
- image_url: {
- url: screenshot
- }
- }))
- });
+ Respond ONLY with the complete Playwright test code, no explanations.`;
+ const messageContent = createMessageContent(
+ promptText,
+ screenshots,
+ options.includeScreenshots !== false
+ );
+ const systemPrompt = `You are an expert test automation engineer specializing in Playwright and Midscene.
+ Your task is to generate a complete, executable Playwright test using @midscene/web/playwright that reproduces a recorded browser session.
+
+ ${PLAYWRIGHT_EXAMPLE_CODE}`;
+ const prompt = [
+ {
+ role: "system",
+ content: systemPrompt
+ },
+ {
+ role: "user",
+ content: messageContent
  }
+ ];
+ if (options.stream && options.onChunk) {
+ return await call(prompt, 2 /* EXTRACT_DATA */, void 0, {
+ stream: true,
+ onChunk: options.onChunk
+ });
+ } else {
  const response = await call(prompt, 2 /* EXTRACT_DATA */);
  if (response?.content && typeof response.content === "string") {
- return response.content;
+ return {
+ content: response.content,
+ usage: response.usage,
+ isStreamed: false
+ };
  }
- throw new Error("Failed to generate YAML test configuration");
- } catch (error) {
- throw new Error(`Failed to generate YAML test: ${error}`);
+ throw new Error("Failed to generate Playwright test code");
  }
  };
 
@@ -2567,8 +2753,10 @@ export {
  callAiFn,
  adaptBboxToRect,
  expandSearchArea,
- generatePlaywrightTest,
  generateYamlTest,
+ generateYamlTestStream,
+ generatePlaywrightTest,
+ generatePlaywrightTestStream,
  AiLocateElement,
  AiLocateSection,
  AiExtractElementInfo,
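
With the export list updated, the streaming variants sit alongside the originals. Called without { stream, onChunk }, both *Stream functions fall back to a single-shot request and resolve to { content, usage, isStreamed: false }, as the non-streaming branches above show; a short sketch (import path assumed, as before):

    import {
      generatePlaywrightTestStream,
      generateYamlTestStream,
    } from "@midscene/core/ai-model"; // path assumed

    async function generateBoth(events: unknown[]) {
      // No stream/onChunk options: one request each, isStreamed reported as false.
      const playwright = await generatePlaywrightTestStream(events, { testName: "demo" });
      const yaml = await generateYamlTestStream(events, { testName: "demo" });
      return { playwright: playwright.content, yaml: yaml.content };
    }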
@@ -2578,4 +2766,4 @@ export {
  resizeImageForUiTars
  };
 
- //# sourceMappingURL=chunk-QT5OZCDN.js.map
+ //# sourceMappingURL=chunk-H3KP5MGB.js.map