npm - @langwatch/scenario - Versions diffs - 0.2.0 → 0.2.2 - Mend

@langwatch/scenario 0.2.0 → 0.2.2

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (9)

package/dist/chunk-NUZZAQV2.mjs +622 -0
package/dist/index.d.mts +65 -15
package/dist/index.d.ts +65 -15
package/dist/index.js +317 -97
package/dist/index.mjs +122 -173
package/dist/integrations/vitest/setup.js +282 -105
package/dist/integrations/vitest/setup.mjs +1 -1
package/package.json +4 -3
package/dist/chunk-ORWSJC5F.mjs +0 -309

package/dist/index.mjs (changed)

@@ -1,7 +1,23 @@
 import {
+  AgentAdapter,
+  AgentRole,
+  DEFAULT_TEMPERATURE,
   EventBus,
-  Logger
-} from "./chunk-ORWSJC5F.mjs";
+  JudgeAgentAdapter,
+  Logger,
+  UserSimulatorAgentAdapter,
+  allAgentRoles,
+  defineConfig,
+  domain_exports,
+  env,
+  generateMessageId,
+  generateScenarioId,
+  generateScenarioRunId,
+  generateThreadId,
+  getBatchRunId,
+  getProjectConfig,
+  scenarioProjectConfigSchema
+} from "./chunk-NUZZAQV2.mjs";
 import {
   __export
 } from "./chunk-7P6ASYW6.mjs";
@@ -15,61 +31,7 @@ __export(agents_exports, {
 // src/agents/judge-agent.ts
 import { generateText, tool } from "ai";
-import { z as z2 } from "zod";
-// src/domain/index.ts
-var domain_exports = {};
-__export(domain_exports, {
-  AgentAdapter: () => AgentAdapter,
-  AgentRole: () => AgentRole,
-  JudgeAgentAdapter: () => JudgeAgentAdapter,
-  UserSimulatorAgentAdapter: () => UserSimulatorAgentAdapter,
-  allAgentRoles: () => allAgentRoles,
-  defineConfig: () => defineConfig,
-  scenarioProjectConfigSchema: () => scenarioProjectConfigSchema
-});
-// src/domain/core/config.ts
 import { z } from "zod";
-var scenarioProjectConfigSchema = z.object({
-  defaultModel: z.object({
-    model: z.custom(),
-    temperature: z.number().min(0).max(1).optional().default(0),
-    maxTokens: z.number().optional()
-  }).optional(),
-  langwatchEndpoint: z.string().optional(),
-  langwatchApiKey: z.string().optional()
-}).strict();
-function defineConfig(config2) {
-  return config2;
-}
-// src/domain/agents/index.ts
-var AgentRole = /* @__PURE__ */ ((AgentRole2) => {
-  AgentRole2["USER"] = "User";
-  AgentRole2["AGENT"] = "Agent";
-  AgentRole2["JUDGE"] = "Judge";
-  return AgentRole2;
-})(AgentRole || {});
-var allAgentRoles = ["User" /* USER */, "Agent" /* AGENT */, "Judge" /* JUDGE */];
-var AgentAdapter = class {
-  role = "Agent" /* AGENT */;
-  constructor(input) {
-    void input;
-  }
-};
-var UserSimulatorAgentAdapter = class {
-  role = "User" /* USER */;
-  constructor(input) {
-    void input;
-  }
-};
-var JudgeAgentAdapter = class {
-  role = "Judge" /* JUDGE */;
-  constructor(input) {
-    void input;
-  }
-};
 // src/agents/utils.ts
 var toolMessageRole = "tool";
@@ -126,81 +88,19 @@ var criterionToParamName = (criterion) => {
   return criterion.replace(/"/g, "").replace(/[^a-zA-Z0-9]/g, "_").replace(/ /g, "_").toLowerCase().substring(0, 70);
 };
-// src/config/load.ts
-import fs from "node:fs/promises";
-import path from "node:path";
-import { pathToFileURL } from "node:url";
-async function loadScenarioProjectConfig() {
-  const cwd = process.cwd();
-  const configNames = [
-    "scenario.config.js",
-    "scenario.config.mjs"
-  ];
-  for (const name of configNames) {
-    const fullPath = path.join(cwd, name);
-    try {
-      await fs.access(fullPath);
-      const configModule = await import(pathToFileURL(fullPath).href);
-      const config2 = configModule.default || configModule;
-      const parsed = scenarioProjectConfigSchema.safeParse(config2);
-      if (!parsed.success) {
-        throw new Error(
-          `Invalid config file ${name}: ${JSON.stringify(parsed.error.format(), null, 2)}`
-        );
-      }
-      return parsed.data;
-    } catch (error) {
-      if (error instanceof Error && "code" in error && error.code === "ENOENT") {
-        continue;
-      }
-      throw error;
-    }
-  }
-  return await scenarioProjectConfigSchema.parseAsync({});
-}
-// src/config/index.ts
-var logger = new Logger("scenario.config");
-var configLoaded = false;
-var config = null;
-var configLoadPromise = null;
-async function loadProjectConfig() {
-  if (configLoaded) {
-    return;
-  }
-  if (configLoadPromise) {
-    return configLoadPromise;
-  }
-  configLoadPromise = (async () => {
-    try {
-      config = await loadScenarioProjectConfig();
-      logger.info("loaded scenario project config", { config });
-    } catch (error) {
-      logger.error("error loading scenario project config", { error });
-    } finally {
-      configLoaded = true;
-    }
-  })();
-  return configLoadPromise;
-}
-async function getProjectConfig() {
-  await loadProjectConfig();
-  return config;
-}
 // src/utils/config.ts
-function mergeConfig(config2, projectConfig) {
+function mergeConfig(config, projectConfig) {
   if (!projectConfig) {
-    return config2;
+    return config;
   }
   return {
     ...projectConfig.defaultModel,
-    ...config2
+    ...config
   };
 }
-function mergeAndValidateConfig(config2, projectConfig) {
+function mergeAndValidateConfig(config, projectConfig) {
   var _a;
-  const mergedConfig = mergeConfig(config2, projectConfig);
+  const mergedConfig = mergeConfig(config, projectConfig);
   mergedConfig.model = mergedConfig.model ?? ((_a = projectConfig == null ? void 0 : projectConfig.defaultModel) == null ? void 0 : _a.model);
   if (!mergedConfig.model) {
     throw new Error("Model is required");
@@ -238,24 +138,24 @@ ${criteriaList}
 function buildContinueTestTool() {
   return tool({
     description: "Continue the test with the next step",
-    parameters: z2.object({})
+    parameters: z.object({})
   });
 }
 function buildFinishTestTool(criteria) {
   const criteriaNames = criteria.map(criterionToParamName);
   return tool({
     description: "Complete the test with a final verdict",
-    parameters: z2.object({
-      criteria: z2.object(
+    parameters: z.object({
+      criteria: z.object(
         Object.fromEntries(
           criteriaNames.map((name, idx) => [
             name,
-            z2.enum(["true", "false", "inconclusive"]).describe(criteria[idx])
+            z.enum(["true", "false", "inconclusive"]).describe(criteria[idx])
           ])
         )
       ).strict().describe("Strict verdict for each criterion"),
-      reasoning: z2.string().describe("Explanation of what the final verdict should be"),
-      verdict: z2.enum(["success", "failure", "inconclusive"]).describe("The final verdict of the test")
+      reasoning: z.string().describe("Explanation of what the final verdict should be"),
+      verdict: z.enum(["success", "failure", "inconclusive"]).describe("The final verdict of the test")
     })
   });
 }
@@ -365,18 +265,18 @@ ${description}
 </rules>
 `.trim();
 }
-var userSimulatorAgent = (config2) => {
+var userSimulatorAgent = (config) => {
   return {
     role: "User" /* USER */,
     call: async (input) => {
-      const systemPrompt = buildSystemPrompt2(input.scenarioConfig.description);
+      const systemPrompt = (config == null ? void 0 : config.systemPrompt) ?? buildSystemPrompt2(input.scenarioConfig.description);
       const messages = [
         { role: "system", content: systemPrompt },
         { role: "assistant", content: "Hello, how can I help you today" },
         ...input.messages
       ];
       const projectConfig = await getProjectConfig();
-      const mergedConfig = mergeAndValidateConfig(config2 ?? {}, projectConfig);
+      const mergedConfig = mergeAndValidateConfig(config ?? {}, projectConfig);
       if (!mergedConfig.model) {
         throw new Error("Model is required for the user simulator agent");
       }
@@ -384,7 +284,7 @@ var userSimulatorAgent = (config2) => {
       const completion = await generateText2({
         model: mergedConfig.model,
         messages: reversedMessages,
-        temperature: mergedConfig.temperature ?? 0,
+        temperature: mergedConfig.temperature ?? DEFAULT_TEMPERATURE,
         maxTokens: mergedConfig.maxTokens
       });
       const messageContent = completion.text;
@@ -406,28 +306,6 @@ __export(execution_exports, {
 // src/execution/scenario-execution.ts
 import { Subject } from "rxjs";
-// src/utils/ids.ts
-import { generate, parse } from "xksuid";
-var batchRunId = null;
-function generateThreadId() {
-  return `thread_${generate()}`;
-}
-function generateScenarioRunId() {
-  return `scenariorun_${generate()}`;
-}
-function generateScenarioId() {
-  return `scenario_${generate()}`;
-}
-function getBatchRunId() {
-  if (!batchRunId) {
-    batchRunId = process.env.SCENARIO_BATCH_RUN_ID ?? `scenariobatchrun_${generate()}`;
-  }
-  return batchRunId;
-}
-function generateMessageId() {
-  return `scenariomsg_${generate()}`;
-}
 // src/execution/scenario-execution-state.ts
 var ScenarioExecutionState = class {
   _messages = [];
@@ -435,9 +313,9 @@ var ScenarioExecutionState = class {
   _threadId = "";
   description;
   config;
-  constructor(config2) {
-    this.config = config2;
-    this.description = config2.description;
+  constructor(config) {
+    this.config = config;
+    this.description = config.description;
   }
   get messages() {
     return this._messages;
@@ -499,8 +377,79 @@ var ScenarioExecutionState = class {
   }
 };
+// src/utils/message-conversion.ts
+function convertCoreMessagesToAguiMessages(coreMessages) {
+  const aguiMessages = [];
+  for (const msg of coreMessages) {
+    const id = "id" in msg && typeof msg.id === "string" ? msg.id : generateMessageId();
+    switch (true) {
+      case msg.role === "system":
+        aguiMessages.push({
+          id,
+          role: "system",
+          content: msg.content
+        });
+        break;
+      case (msg.role === "user" && typeof msg.content === "string"):
+        aguiMessages.push({
+          id,
+          role: "user",
+          content: msg.content
+        });
+        break;
+      // Handle any other user message content format
+      case (msg.role === "user" && Array.isArray(msg.content)):
+        aguiMessages.push({
+          id,
+          role: "user",
+          content: JSON.stringify(msg.content)
+        });
+        break;
+      case (msg.role === "assistant" && typeof msg.content === "string"):
+        aguiMessages.push({
+          id,
+          role: "assistant",
+          content: msg.content
+        });
+        break;
+      case (msg.role === "assistant" && Array.isArray(msg.content)): {
+        const toolCalls = msg.content.filter((p) => p.type === "tool-call");
+        const nonToolCalls = msg.content.filter((p) => p.type !== "tool-call");
+        aguiMessages.push({
+          id,
+          role: "assistant",
+          content: JSON.stringify(nonToolCalls),
+          toolCalls: toolCalls.map((c) => ({
+            id: c.toolCallId,
+            type: "function",
+            function: {
+              name: c.toolName,
+              arguments: JSON.stringify(c.args)
+            }
+          }))
+        });
+        break;
+      }
+      case msg.role === "tool":
+        msg.content.map((p, i) => {
+          aguiMessages.push({
+            id: `${id}-${i}`,
+            role: "tool",
+            toolCallId: p.toolCallId,
+            content: JSON.stringify(p.result)
+          });
+        });
+        break;
+      default:
+        throw new Error(`Unsupported message role: ${msg.role}`);
+    }
+  }
+  return aguiMessages;
+}
+var message_conversion_default = convertCoreMessagesToAguiMessages;
 // src/execution/scenario-execution.ts
-var batchRunId2 = getBatchRunId();
+var batchRunId = getBatchRunId();
 var ScenarioExecution = class {
   state;
   eventSubject = new Subject();
@@ -523,17 +472,17 @@ var ScenarioExecution = class {
    * @param config The scenario configuration.
    * @param script The script steps to execute.
    */
-  constructor(config2, script) {
+  constructor(config, script) {
     this.config = {
-      id: config2.id ?? generateScenarioId(),
-      name: config2.name,
-      description: config2.description,
-      agents: config2.agents,
+      id: config.id ?? generateScenarioId(),
+      name: config.name,
+      description: config.description,
+      agents: config.agents,
       script,
-      verbose: config2.verbose ?? false,
-      maxTurns: config2.maxTurns ?? 10,
-      threadId: config2.threadId ?? generateThreadId(),
-      setId: config2.setId
+      verbose: config.verbose ?? false,
+      maxTurns: config.maxTurns ?? 10,
+      threadId: config.threadId ?? generateThreadId(),
+      setId: config.setId
     };
     this.state = new ScenarioExecutionState(this.config);
     this.reset();
@@ -912,7 +861,7 @@ var ScenarioExecution = class {
       type: "placeholder",
       // This will be replaced by the specific event type
       timestamp: Date.now(),
-      batchRunId: batchRunId2,
+      batchRunId,
       scenarioId: this.config.id,
       scenarioRunId,
       scenarioSetId: this.config.setId
@@ -938,7 +887,7 @@ var ScenarioExecution = class {
     this.emitEvent({
       ...this.makeBaseEvent({ scenarioRunId }),
       type: "SCENARIO_MESSAGE_SNAPSHOT" /* MESSAGE_SNAPSHOT */,
-      messages: this.state.messages
+      messages: message_conversion_default(this.state.messages)
       // Add any other required fields from MessagesSnapshotEventSchema
     });
   }
@@ -1061,10 +1010,9 @@ async function run(cfg) {
   let eventBus = null;
   let subscription = null;
   try {
-    const projectConfig = await loadScenarioProjectConfig();
     eventBus = new EventBus({
-      endpoint: projectConfig.langwatchEndpoint ?? process.env.LANGWATCH_ENDPOINT ?? "https://app.langwatch.ai",
-      apiKey: projectConfig.langwatchApiKey ?? process.env.LANGWATCH_API_KEY
+      endpoint: env.LANGWATCH_ENDPOINT,
+      apiKey: env.LANGWATCH_API_KEY
     });
     eventBus.listen();
     subscription = eventBus.subscribeTo(execution.events$);
@@ -1139,6 +1087,7 @@ var index_default = scenario;
 export {
   AgentAdapter,
   AgentRole,
+  DEFAULT_TEMPERATURE,
   JudgeAgentAdapter,
   ScenarioExecution,
   ScenarioExecutionState,