npm - @langwatch/scenario - Versions diffs - 0.2.13 → 0.3.0 - Mend

@langwatch/scenario 0.2.13 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/README.md +35 -8
package/dist/{chunk-6SKQWXT7.mjs → chunk-3Z7E24UI.mjs} +26 -6
package/dist/{chunk-OL4RFXV4.mjs → chunk-RHTLQKEJ.mjs} +1 -1
package/dist/index.d.mts +109 -130
package/dist/index.d.ts +109 -130
package/dist/index.js +95 -75
package/dist/index.mjs +23 -23
package/dist/integrations/vitest/reporter.js +14 -10
package/dist/integrations/vitest/reporter.mjs +7 -3
package/dist/integrations/vitest/setup.js +70 -50
package/dist/integrations/vitest/setup.mjs +2 -2
package/package.json +6 -5

package/dist/index.js CHANGED Viewed

@@ -67,7 +67,7 @@ __export(agents_exports, {
 // src/agents/judge-agent.ts
 var import_ai = require("ai");
-var import_zod3 = require("zod");
+var import_v43 = require("zod/v4");
 // src/domain/index.ts
 var domain_exports = {};
@@ -85,15 +85,15 @@ __export(domain_exports, {
 });
 // src/domain/core/config.ts
-var import_zod = require("zod");
+var import_v4 = require("zod/v4");
 var DEFAULT_TEMPERATURE = 0;
-var scenarioProjectConfigSchema = import_zod.z.object({
-  defaultModel: import_zod.z.object({
-    model: import_zod.z.custom(),
-    temperature: import_zod.z.number().min(0).max(1).optional().default(DEFAULT_TEMPERATURE),
-    maxTokens: import_zod.z.number().optional()
+var scenarioProjectConfigSchema = import_v4.z.object({
+  defaultModel: import_v4.z.object({
+    model: import_v4.z.custom(),
+    temperature: import_v4.z.number().min(0).max(1).optional().default(DEFAULT_TEMPERATURE),
+    maxTokens: import_v4.z.number().optional()
   }).optional(),
-  headless: import_zod.z.boolean().optional().default(
+  headless: import_v4.z.boolean().optional().default(
     typeof process !== "undefined" ? !["false", "0"].includes(process.env.SCENARIO_HEADLESS || "false") : false
   )
 }).strict();
@@ -183,7 +183,7 @@ var criterionToParamName = (criterion) => {
 };
 // src/config/env.ts
-var import_zod2 = require("zod");
+var import_v42 = require("zod/v4");
 // src/config/log-levels.ts
 var LogLevel = /* @__PURE__ */ ((LogLevel2) => {
@@ -196,37 +196,37 @@ var LogLevel = /* @__PURE__ */ ((LogLevel2) => {
 var LOG_LEVELS = Object.values(LogLevel);
 // src/config/env.ts
-var envSchema = import_zod2.z.object({
+var envSchema = import_v42.z.object({
   /**
    * LangWatch API key for event reporting.
    * If not provided, events will not be sent to LangWatch.
    */
-  LANGWATCH_API_KEY: import_zod2.z.string().optional(),
+  LANGWATCH_API_KEY: import_v42.z.string().optional(),
   /**
    * LangWatch endpoint URL for event reporting.
    * Defaults to the production LangWatch endpoint.
    */
-  LANGWATCH_ENDPOINT: import_zod2.z.string().url().optional().default("https://app.langwatch.ai"),
+  LANGWATCH_ENDPOINT: import_v42.z.string().url().optional().default("https://app.langwatch.ai"),
   /**
    * Disables simulation report info messages when set to any truthy value.
    * Useful for CI/CD environments or when you want cleaner output.
    */
-  SCENARIO_DISABLE_SIMULATION_REPORT_INFO: import_zod2.z.string().optional().transform((val) => Boolean(val)),
+  SCENARIO_DISABLE_SIMULATION_REPORT_INFO: import_v42.z.string().optional().transform((val) => Boolean(val)),
   /**
    * Node environment - affects logging and behavior.
    * Defaults to 'development' if not specified.
    */
-  NODE_ENV: import_zod2.z.enum(["development", "production", "test"]).default("development"),
+  NODE_ENV: import_v42.z.enum(["development", "production", "test"]).default("development"),
   /**
    * Case-insensitive log level for the scenario package.
    * Defaults to 'info' if not specified.
    */
-  LOG_LEVEL: import_zod2.z.string().toUpperCase().pipe(import_zod2.z.nativeEnum(LogLevel)).optional().default("INFO" /* INFO */),
+  LOG_LEVEL: import_v42.z.string().toUpperCase().pipe(import_v42.z.nativeEnum(LogLevel)).optional().default("INFO" /* INFO */),
   /**
    * Scenario batch run ID.
    * If not provided, a random ID will be generated.
    */
-  SCENARIO_BATCH_RUN_ID: import_zod2.z.string().optional()
+  SCENARIO_BATCH_RUN_ID: import_v42.z.string().optional()
 });
 function getEnv() {
   return envSchema.parse(process.env);
@@ -423,24 +423,24 @@ ${criteriaList}
 function buildContinueTestTool() {
   return (0, import_ai.tool)({
     description: "Continue the test with the next step",
-    parameters: import_zod3.z.object({})
+    inputSchema: import_v43.z.object({})
   });
 }
 function buildFinishTestTool(criteria) {
   const criteriaNames = criteria.map(criterionToParamName);
   return (0, import_ai.tool)({
     description: "Complete the test with a final verdict",
-    parameters: import_zod3.z.object({
-      criteria: import_zod3.z.object(
+    inputSchema: import_v43.z.object({
+      criteria: import_v43.z.object(
         Object.fromEntries(
           criteriaNames.map((name, idx) => [
             name,
-            import_zod3.z.enum(["true", "false", "inconclusive"]).describe(criteria[idx])
+            import_v43.z.enum(["true", "false", "inconclusive"]).describe(criteria[idx])
           ])
         )
       ).strict().describe("Strict verdict for each criterion"),
-      reasoning: import_zod3.z.string().describe("Explanation of what the final verdict should be"),
-      verdict: import_zod3.z.enum(["success", "failure", "inconclusive"]).describe("The final verdict of the test")
+      reasoning: import_v43.z.string().describe("Explanation of what the final verdict should be"),
+      verdict: import_v43.z.enum(["success", "failure", "inconclusive"]).describe("The final verdict of the test")
     })
   });
 }
@@ -488,7 +488,7 @@ var JudgeAgent = class extends JudgeAgentAdapter {
       model: mergedConfig.model,
       messages,
       temperature: mergedConfig.temperature ?? 0,
-      maxTokens: mergedConfig.maxTokens,
+      maxOutputTokens: mergedConfig.maxTokens,
       tools,
       toolChoice
     });
@@ -497,7 +497,7 @@ var JudgeAgent = class extends JudgeAgentAdapter {
       const toolCall = completion.toolCalls[0];
       switch (toolCall.toolName) {
         case "finish_test": {
-          args = toolCall.args;
+          args = toolCall.input;
           const verdict = args.verdict || "inconclusive";
           const reasoning = args.reasoning || "No reasoning provided";
           const criteria = args.criteria || {};
@@ -595,7 +595,7 @@ var UserSimulatorAgent = class extends UserSimulatorAgentAdapter {
       model: mergedConfig.model,
       messages: reversedMessages,
       temperature: mergedConfig.temperature ?? DEFAULT_TEMPERATURE,
-      maxTokens: mergedConfig.maxTokens
+      maxOutputTokens: mergedConfig.maxTokens
     });
     const messageContent = completion.text;
     if (!messageContent) {
@@ -769,7 +769,7 @@ var ScenarioExecutionState = class {
 // src/events/schema.ts
 var import_core = require("@ag-ui/core");
-var import_zod4 = require("zod");
+var import_zod = require("zod");
 var Verdict = /* @__PURE__ */ ((Verdict2) => {
   Verdict2["SUCCESS"] = "success";
   Verdict2["FAILURE"] = "failure";
@@ -785,64 +785,64 @@ var ScenarioRunStatus = /* @__PURE__ */ ((ScenarioRunStatus2) => {
   ScenarioRunStatus2["FAILED"] = "FAILED";
   return ScenarioRunStatus2;
 })(ScenarioRunStatus || {});
-var baseEventSchema = import_zod4.z.object({
-  type: import_zod4.z.nativeEnum(import_core.EventType),
-  timestamp: import_zod4.z.number(),
-  rawEvent: import_zod4.z.any().optional()
+var baseEventSchema = import_zod.z.object({
+  type: import_zod.z.nativeEnum(import_core.EventType),
+  timestamp: import_zod.z.number(),
+  rawEvent: import_zod.z.any().optional()
 });
-var batchRunIdSchema = import_zod4.z.string();
-var scenarioRunIdSchema = import_zod4.z.string();
-var scenarioIdSchema = import_zod4.z.string();
+var batchRunIdSchema = import_zod.z.string();
+var scenarioRunIdSchema = import_zod.z.string();
+var scenarioIdSchema = import_zod.z.string();
 var baseScenarioEventSchema = baseEventSchema.extend({
   batchRunId: batchRunIdSchema,
   scenarioId: scenarioIdSchema,
   scenarioRunId: scenarioRunIdSchema,
-  scenarioSetId: import_zod4.z.string().optional().default("default")
+  scenarioSetId: import_zod.z.string().optional().default("default")
 });
 var scenarioRunStartedSchema = baseScenarioEventSchema.extend({
-  type: import_zod4.z.literal("SCENARIO_RUN_STARTED" /* RUN_STARTED */),
-  metadata: import_zod4.z.object({
-    name: import_zod4.z.string().optional(),
-    description: import_zod4.z.string().optional()
+  type: import_zod.z.literal("SCENARIO_RUN_STARTED" /* RUN_STARTED */),
+  metadata: import_zod.z.object({
+    name: import_zod.z.string().optional(),
+    description: import_zod.z.string().optional()
   })
 });
-var scenarioResultsSchema = import_zod4.z.object({
-  verdict: import_zod4.z.nativeEnum(Verdict),
-  reasoning: import_zod4.z.string().optional(),
-  metCriteria: import_zod4.z.array(import_zod4.z.string()),
-  unmetCriteria: import_zod4.z.array(import_zod4.z.string()),
-  error: import_zod4.z.string().optional()
+var scenarioResultsSchema = import_zod.z.object({
+  verdict: import_zod.z.nativeEnum(Verdict),
+  reasoning: import_zod.z.string().optional(),
+  metCriteria: import_zod.z.array(import_zod.z.string()),
+  unmetCriteria: import_zod.z.array(import_zod.z.string()),
+  error: import_zod.z.string().optional()
 });
 var scenarioRunFinishedSchema = baseScenarioEventSchema.extend({
-  type: import_zod4.z.literal("SCENARIO_RUN_FINISHED" /* RUN_FINISHED */),
-  status: import_zod4.z.nativeEnum(ScenarioRunStatus),
+  type: import_zod.z.literal("SCENARIO_RUN_FINISHED" /* RUN_FINISHED */),
+  status: import_zod.z.nativeEnum(ScenarioRunStatus),
   results: scenarioResultsSchema.optional().nullable()
 });
 var scenarioMessageSnapshotSchema = import_core.MessagesSnapshotEventSchema.merge(
   baseScenarioEventSchema.extend({
-    type: import_zod4.z.literal("SCENARIO_MESSAGE_SNAPSHOT" /* MESSAGE_SNAPSHOT */)
+    type: import_zod.z.literal("SCENARIO_MESSAGE_SNAPSHOT" /* MESSAGE_SNAPSHOT */)
   })
 );
-var scenarioEventSchema = import_zod4.z.discriminatedUnion("type", [
+var scenarioEventSchema = import_zod.z.discriminatedUnion("type", [
   scenarioRunStartedSchema,
   scenarioRunFinishedSchema,
   scenarioMessageSnapshotSchema
 ]);
-var successSchema = import_zod4.z.object({ success: import_zod4.z.boolean() });
-var errorSchema = import_zod4.z.object({ error: import_zod4.z.string() });
-var stateSchema = import_zod4.z.object({
-  state: import_zod4.z.object({
-    messages: import_zod4.z.array(import_zod4.z.any()),
-    status: import_zod4.z.string()
+var successSchema = import_zod.z.object({ success: import_zod.z.boolean() });
+var errorSchema = import_zod.z.object({ error: import_zod.z.string() });
+var stateSchema = import_zod.z.object({
+  state: import_zod.z.object({
+    messages: import_zod.z.array(import_zod.z.any()),
+    status: import_zod.z.string()
   })
 });
-var runsSchema = import_zod4.z.object({ runs: import_zod4.z.array(import_zod4.z.string()) });
-var eventsSchema = import_zod4.z.object({ events: import_zod4.z.array(scenarioEventSchema) });
+var runsSchema = import_zod.z.object({ runs: import_zod.z.array(import_zod.z.string()) });
+var eventsSchema = import_zod.z.object({ events: import_zod.z.array(scenarioEventSchema) });
 // src/utils/convert-core-messages-to-agui-messages.ts
-function convertCoreMessagesToAguiMessages(coreMessages) {
+function convertModelMessagesToAguiMessages(modelMessages) {
   const aguiMessages = [];
-  for (const msg of coreMessages) {
+  for (const msg of modelMessages) {
     const id = "id" in msg && typeof msg.id === "string" ? msg.id : generateMessageId();
     switch (true) {
       case msg.role === "system":
@@ -886,7 +886,7 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
             type: "function",
             function: {
               name: c.toolName,
-              arguments: JSON.stringify(c.args)
+              arguments: JSON.stringify(c.input)
             }
           }))
         });
@@ -894,11 +894,12 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
       }
       case msg.role === "tool":
         msg.content.map((p, i) => {
+          var _a;
           aguiMessages.push({
             id: `${id}-${i}`,
             role: "tool",
             toolCallId: p.toolCallId,
-            content: JSON.stringify(p.result)
+            content: JSON.stringify((_a = p.output) == null ? void 0 : _a.value)
           });
         });
         break;
@@ -908,7 +909,7 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
   }
   return aguiMessages;
 }
-var convert_core_messages_to_agui_messages_default = convertCoreMessagesToAguiMessages;
+var convert_core_messages_to_agui_messages_default = convertModelMessagesToAguiMessages;
 // src/execution/scenario-execution.ts
 var ScenarioExecution = class {
@@ -974,7 +975,7 @@ var ScenarioExecution = class {
   /**
    * Gets the complete conversation history as an array of messages.
    *
-   * @returns Array of CoreMessage objects representing the full conversation
+   * @returns Array of ModelMessage objects representing the full conversation
    */
   get messages() {
     return this.state.messages;
@@ -1207,7 +1208,7 @@ var ScenarioExecution = class {
    * - "assistant" messages are routed to AGENT role agents
    * - Other message types are added directly to the conversation
    *
-   * @param message - The CoreMessage to add to the conversation
+   * @param message - The ModelMessage to add to the conversation
    *
    * @example
    * ```typescript
@@ -1236,7 +1237,7 @@ var ScenarioExecution = class {
    *
    * This method is part of the ScenarioExecutionLike interface used by script steps.
    *
-   * @param content - Optional content for the user's message. Can be a string or CoreMessage.
+   * @param content - Optional content for the user's message. Can be a string or ModelMessage.
    *                 If not provided, the user simulator agent will generate the content.
    *
    * @example
@@ -1247,7 +1248,7 @@ var ScenarioExecution = class {
    * // Let user simulator generate content
    * await execution.user();
    *
-   * // Use a CoreMessage object
+   * // Use a ModelMessage object
    * await execution.user({
    *   role: "user",
    *   content: "Tell me a joke"
@@ -1266,7 +1267,7 @@ var ScenarioExecution = class {
    *
    * This method is part of the ScenarioExecutionLike interface used by script steps.
    *
-   * @param content - Optional content for the agent's response. Can be a string or CoreMessage.
+   * @param content - Optional content for the agent's response. Can be a string or ModelMessage.
    *                 If not provided, the agent under test will generate the response.
    *
    * @example
@@ -1277,7 +1278,7 @@ var ScenarioExecution = class {
    * // Use provided content
    * await execution.agent("The weather is sunny today!");
    *
-   * // Use a CoreMessage object
+   * // Use a ModelMessage object
    * await execution.agent({
    *   role: "assistant",
    *   content: "I'm here to help you with weather information."
@@ -1886,9 +1887,27 @@ __export(runner_exports, {
 var import_rxjs3 = require("rxjs");
 // src/events/event-alert-message-logger.ts
+var fs2 = __toESM(require("fs"));
+var os = __toESM(require("os"));
+var path2 = __toESM(require("path"));
 var import_open = __toESM(require("open"));
-var EventAlertMessageLogger = class _EventAlertMessageLogger {
-  static shownBatchIds = /* @__PURE__ */ new Set();
+var EventAlertMessageLogger = class {
+  /**
+   * Creates a coordination file to prevent duplicate messages across processes.
+   * Returns true if this process should show the message (first one to create the file).
+   */
+  createCoordinationFile(type) {
+    try {
+      const batchId = getBatchRunId();
+      const tmpDir = os.tmpdir();
+      const fileName = `scenario-${type}-${batchId}`;
+      const filePath = path2.join(tmpDir, fileName);
+      fs2.writeFileSync(filePath, process.pid.toString(), { flag: "wx" });
+      return true;
+    } catch {
+      return false;
+    }
+  }
   /**
    * Shows a fancy greeting message about simulation reporting status.
    * Only shows once per batch run to avoid spam.
@@ -1897,10 +1916,9 @@ var EventAlertMessageLogger = class _EventAlertMessageLogger {
     if (this.isGreetingDisabled()) {
       return;
     }
-    if (_EventAlertMessageLogger.shownBatchIds.has(getBatchRunId())) {
+    if (!this.createCoordinationFile("greeting")) {
       return;
     }
-    _EventAlertMessageLogger.shownBatchIds.add(getBatchRunId());
     this.displayGreeting();
   }
   /**
@@ -1911,6 +1929,9 @@ var EventAlertMessageLogger = class _EventAlertMessageLogger {
     if (this.isGreetingDisabled()) {
       return;
     }
+    if (!this.createCoordinationFile(`watch-${params.scenarioSetId}`)) {
+      return;
+    }
     await this.displayWatchMessage(params);
   }
   isGreetingDisabled() {
@@ -2254,14 +2275,13 @@ function formatPart(part) {
     case "file":
       return `(file): ${part.filename} ${typeof part.data === "string" ? `url:${part.data}` : "base64:omitted"}`;
     case "tool-call":
-      return `(tool call): ${part.toolName} id:${part.toolCallId} args:(${JSON.stringify(part.args)})`;
+      return `(tool call): ${part.toolName} id:${part.toolCallId} args:(${JSON.stringify(part.input)})`;
     case "tool-result":
-      return `(tool result): ${part.toolName} id:${part.toolCallId} result:(${JSON.stringify(part.result)})`;
+      return `(tool result): ${part.toolName} id:${part.toolCallId} result:(${JSON.stringify(part.output)})`;
     case "reasoning":
       return `(reasoning): ${part.text}`;
-    case "redacted-reasoning":
-      return `(redacted reasoning): ${part.data}`;
     default:
+      part;
       return `Unknown content: ${JSON.stringify(part)}`;
   }
 }

package/dist/index.mjs CHANGED Viewed

@@ -17,11 +17,11 @@ import {
   getBatchRunId,
   getProjectConfig,
   scenarioProjectConfigSchema
-} from "./chunk-6SKQWXT7.mjs";
+} from "./chunk-3Z7E24UI.mjs";
 import {
   Logger,
   getEnv
-} from "./chunk-OL4RFXV4.mjs";
+} from "./chunk-RHTLQKEJ.mjs";
 import {
   __export
 } from "./chunk-7P6ASYW6.mjs";
@@ -35,7 +35,7 @@ __export(agents_exports, {
 // src/agents/judge-agent.ts
 import { generateText, tool } from "ai";
-import { z } from "zod";
+import { z } from "zod/v4";
 // src/agents/utils.ts
 var toolMessageRole = "tool";
@@ -142,14 +142,14 @@ ${criteriaList}
 function buildContinueTestTool() {
   return tool({
     description: "Continue the test with the next step",
-    parameters: z.object({})
+    inputSchema: z.object({})
   });
 }
 function buildFinishTestTool(criteria) {
   const criteriaNames = criteria.map(criterionToParamName);
   return tool({
     description: "Complete the test with a final verdict",
-    parameters: z.object({
+    inputSchema: z.object({
       criteria: z.object(
         Object.fromEntries(
           criteriaNames.map((name, idx) => [
@@ -207,7 +207,7 @@ var JudgeAgent = class extends JudgeAgentAdapter {
       model: mergedConfig.model,
       messages,
       temperature: mergedConfig.temperature ?? 0,
-      maxTokens: mergedConfig.maxTokens,
+      maxOutputTokens: mergedConfig.maxTokens,
       tools,
       toolChoice
     });
@@ -216,7 +216,7 @@ var JudgeAgent = class extends JudgeAgentAdapter {
       const toolCall = completion.toolCalls[0];
       switch (toolCall.toolName) {
         case "finish_test": {
-          args = toolCall.args;
+          args = toolCall.input;
           const verdict = args.verdict || "inconclusive";
           const reasoning = args.reasoning || "No reasoning provided";
           const criteria = args.criteria || {};
@@ -314,7 +314,7 @@ var UserSimulatorAgent = class extends UserSimulatorAgentAdapter {
       model: mergedConfig.model,
       messages: reversedMessages,
       temperature: mergedConfig.temperature ?? DEFAULT_TEMPERATURE,
-      maxTokens: mergedConfig.maxTokens
+      maxOutputTokens: mergedConfig.maxTokens
     });
     const messageContent = completion.text;
     if (!messageContent) {
@@ -441,9 +441,9 @@ var ScenarioExecutionState = class {
 };
 // src/utils/convert-core-messages-to-agui-messages.ts
-function convertCoreMessagesToAguiMessages(coreMessages) {
+function convertModelMessagesToAguiMessages(modelMessages) {
   const aguiMessages = [];
-  for (const msg of coreMessages) {
+  for (const msg of modelMessages) {
     const id = "id" in msg && typeof msg.id === "string" ? msg.id : generateMessageId();
     switch (true) {
       case msg.role === "system":
@@ -487,7 +487,7 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
             type: "function",
             function: {
               name: c.toolName,
-              arguments: JSON.stringify(c.args)
+              arguments: JSON.stringify(c.input)
             }
           }))
         });
@@ -495,11 +495,12 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
       }
       case msg.role === "tool":
         msg.content.map((p, i) => {
+          var _a;
           aguiMessages.push({
             id: `${id}-${i}`,
             role: "tool",
             toolCallId: p.toolCallId,
-            content: JSON.stringify(p.result)
+            content: JSON.stringify((_a = p.output) == null ? void 0 : _a.value)
           });
         });
         break;
@@ -509,7 +510,7 @@ function convertCoreMessagesToAguiMessages(coreMessages) {
   }
   return aguiMessages;
 }
-var convert_core_messages_to_agui_messages_default = convertCoreMessagesToAguiMessages;
+var convert_core_messages_to_agui_messages_default = convertModelMessagesToAguiMessages;
 // src/execution/scenario-execution.ts
 var ScenarioExecution = class {
@@ -575,7 +576,7 @@ var ScenarioExecution = class {
   /**
    * Gets the complete conversation history as an array of messages.
    *
-   * @returns Array of CoreMessage objects representing the full conversation
+   * @returns Array of ModelMessage objects representing the full conversation
    */
   get messages() {
     return this.state.messages;
@@ -808,7 +809,7 @@ var ScenarioExecution = class {
    * - "assistant" messages are routed to AGENT role agents
    * - Other message types are added directly to the conversation
    *
-   * @param message - The CoreMessage to add to the conversation
+   * @param message - The ModelMessage to add to the conversation
    *
    * @example
    * ```typescript
@@ -837,7 +838,7 @@ var ScenarioExecution = class {
    *
    * This method is part of the ScenarioExecutionLike interface used by script steps.
    *
-   * @param content - Optional content for the user's message. Can be a string or CoreMessage.
+   * @param content - Optional content for the user's message. Can be a string or ModelMessage.
    *                 If not provided, the user simulator agent will generate the content.
    *
    * @example
@@ -848,7 +849,7 @@ var ScenarioExecution = class {
    * // Let user simulator generate content
    * await execution.user();
    *
-   * // Use a CoreMessage object
+   * // Use a ModelMessage object
    * await execution.user({
    *   role: "user",
    *   content: "Tell me a joke"
@@ -867,7 +868,7 @@ var ScenarioExecution = class {
    *
    * This method is part of the ScenarioExecutionLike interface used by script steps.
    *
-   * @param content - Optional content for the agent's response. Can be a string or CoreMessage.
+   * @param content - Optional content for the agent's response. Can be a string or ModelMessage.
    *                 If not provided, the agent under test will generate the response.
    *
    * @example
@@ -878,7 +879,7 @@ var ScenarioExecution = class {
    * // Use provided content
    * await execution.agent("The weather is sunny today!");
    *
-   * // Use a CoreMessage object
+   * // Use a ModelMessage object
    * await execution.agent({
    *   role: "assistant",
    *   content: "I'm here to help you with weather information."
@@ -1600,14 +1601,13 @@ function formatPart(part) {
     case "file":
       return `(file): ${part.filename} ${typeof part.data === "string" ? `url:${part.data}` : "base64:omitted"}`;
     case "tool-call":
-      return `(tool call): ${part.toolName} id:${part.toolCallId} args:(${JSON.stringify(part.args)})`;
+      return `(tool call): ${part.toolName} id:${part.toolCallId} args:(${JSON.stringify(part.input)})`;
     case "tool-result":
-      return `(tool result): ${part.toolName} id:${part.toolCallId} result:(${JSON.stringify(part.result)})`;
+      return `(tool result): ${part.toolName} id:${part.toolCallId} result:(${JSON.stringify(part.output)})`;
     case "reasoning":
       return `(reasoning): ${part.text}`;
-    case "redacted-reasoning":
-      return `(redacted reasoning): ${part.data}`;
     default:
+      part;
       return `Unknown content: ${JSON.stringify(part)}`;
   }
 }

package/dist/integrations/vitest/reporter.js CHANGED Viewed

@@ -38,7 +38,7 @@ var import_path = __toESM(require("path"));
 var import_chalk = __toESM(require("chalk"));
 // src/config/env.ts
-var import_zod = require("zod");
+var import_v4 = require("zod/v4");
 // src/config/log-levels.ts
 var LogLevel = /* @__PURE__ */ ((LogLevel2) => {
@@ -51,37 +51,37 @@ var LogLevel = /* @__PURE__ */ ((LogLevel2) => {
 var LOG_LEVELS = Object.values(LogLevel);
 // src/config/env.ts
-var envSchema = import_zod.z.object({
+var envSchema = import_v4.z.object({
   /**
    * LangWatch API key for event reporting.
    * If not provided, events will not be sent to LangWatch.
    */
-  LANGWATCH_API_KEY: import_zod.z.string().optional(),
+  LANGWATCH_API_KEY: import_v4.z.string().optional(),
   /**
    * LangWatch endpoint URL for event reporting.
    * Defaults to the production LangWatch endpoint.
    */
-  LANGWATCH_ENDPOINT: import_zod.z.string().url().optional().default("https://app.langwatch.ai"),
+  LANGWATCH_ENDPOINT: import_v4.z.string().url().optional().default("https://app.langwatch.ai"),
   /**
    * Disables simulation report info messages when set to any truthy value.
    * Useful for CI/CD environments or when you want cleaner output.
    */
-  SCENARIO_DISABLE_SIMULATION_REPORT_INFO: import_zod.z.string().optional().transform((val) => Boolean(val)),
+  SCENARIO_DISABLE_SIMULATION_REPORT_INFO: import_v4.z.string().optional().transform((val) => Boolean(val)),
   /**
    * Node environment - affects logging and behavior.
    * Defaults to 'development' if not specified.
    */
-  NODE_ENV: import_zod.z.enum(["development", "production", "test"]).default("development"),
+  NODE_ENV: import_v4.z.enum(["development", "production", "test"]).default("development"),
   /**
    * Case-insensitive log level for the scenario package.
    * Defaults to 'info' if not specified.
    */
-  LOG_LEVEL: import_zod.z.string().toUpperCase().pipe(import_zod.z.nativeEnum(LogLevel)).optional().default("INFO" /* INFO */),
+  LOG_LEVEL: import_v4.z.string().toUpperCase().pipe(import_v4.z.nativeEnum(LogLevel)).optional().default("INFO" /* INFO */),
   /**
    * Scenario batch run ID.
    * If not provided, a random ID will be generated.
    */
-  SCENARIO_BATCH_RUN_ID: import_zod.z.string().optional()
+  SCENARIO_BATCH_RUN_ID: import_v4.z.string().optional()
 });
 function getEnv() {
   return envSchema.parse(process.env);
@@ -321,8 +321,12 @@ ${indent(parsedJson)}
     console.log();
     console.log(import_chalk.default.bold.cyan("=== Scenario Test Report ==="));
     console.log(`Total Scenarios: ${total}`);
-    console.log(import_chalk.default.green(`Passed: ${passed}`));
-    console.log(import_chalk.default.red(`Failed: ${failed}`));
+    console.log(
+      passed > 0 ? import_chalk.default.green(`Passed: ${passed}`) : `Passed: ${passed}`
+    );
+    console.log(
+      failed > 0 ? import_chalk.default.red(`Failed: ${failed}`) : `Failed: ${failed}`
+    );
     console.log(`Success Rate: ${import_chalk.default.bold(`${successRate}%`)}`);
     this.results.forEach((r, i) => {
       const statusColor = r.status === "SUCCESS" ? import_chalk.default.green : import_chalk.default.red;

package/dist/integrations/vitest/reporter.mjs CHANGED Viewed

@@ -1,6 +1,6 @@
 import {
   Logger
-} from "../../chunk-OL4RFXV4.mjs";
+} from "../../chunk-RHTLQKEJ.mjs";
 import "../../chunk-7P6ASYW6.mjs";
 // src/integrations/vitest/reporter.ts
@@ -161,8 +161,12 @@ ${indent(parsedJson)}
     console.log();
     console.log(chalk.bold.cyan("=== Scenario Test Report ==="));
     console.log(`Total Scenarios: ${total}`);
-    console.log(chalk.green(`Passed: ${passed}`));
-    console.log(chalk.red(`Failed: ${failed}`));
+    console.log(
+      passed > 0 ? chalk.green(`Passed: ${passed}`) : `Passed: ${passed}`
+    );
+    console.log(
+      failed > 0 ? chalk.red(`Failed: ${failed}`) : `Failed: ${failed}`
+    );
     console.log(`Success Rate: ${chalk.bold(`${successRate}%`)}`);
     this.results.forEach((r, i) => {
       const statusColor = r.status === "SUCCESS" ? chalk.green : chalk.red;