npm - @langwatch/scenario - Versions diffs - 0.4.2 → 0.4.3 - Mend

@langwatch/scenario 0.4.2 → 0.4.3

This diff compares the contents of two publicly available versions of the package, each released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (8)

package/README.md +2 -2
package/dist/index.d.mts +176 -20
package/dist/index.d.ts +176 -20
package/dist/index.js +2677 -1990
package/dist/index.mjs +2659 -1974
package/dist/integrations/vitest/setup.js +5 -2
package/dist/integrations/vitest/setup.mjs +5 -2
package/package.json +3 -2

package/README.md (changed)

@@ -97,7 +97,7 @@ describe("Weather Agent", () => {
       role: AgentRole.AGENT,
       call: async (input) => {
         const response = await generateText({
-          model: openai("gpt-4.1"),
+          model: openai("gpt-4.1-mini"),
           system: `You are a helpful assistant that may help the user with weather information.`,
           messages: input.messages,
           tools: { get_current_weather: getCurrentWeather },
@@ -150,7 +150,7 @@ describe("Weather Agent", () => {
         "The user asks for the weather in a specific city, and the agent should use the weather tool to find it.",
       agents: [
         weatherAgent,
-        scenario.userSimulatorAgent({ model: openai("gpt-4.1") }),
+        scenario.userSimulatorAgent({ model: openai("gpt-4.1-mini") }),
       ],
       script: [
         scenario.user("What's the weather like in Barcelona?"),

package/dist/index.d.mts (changed)

@@ -3,6 +3,7 @@ import { ModelMessage, UserModelMessage, AssistantModelMessage, ToolModelMessage
 import { z } from 'zod/v4';
 import { SpanProcessor, ReadableSpan } from '@opentelemetry/sdk-trace-base';
 import { RealtimeSession } from '@openai/agents/realtime';
+import { SetupObservabilityOptions } from 'langwatch/observability/node';
 import { Observable } from 'rxjs';
 import { z as z$1 } from 'zod';
@@ -178,6 +179,12 @@ interface ScenarioConfig {
      * If not provided, the scenario will not be grouped into a set.
      */
     setId?: string;
+    /**
+     * Optional metadata to attach to the scenario run.
+     * Accepts arbitrary key-value pairs (e.g. prompt IDs, environments, versions).
+     * The `langwatch` key is reserved for platform-internal use.
+     */
+    metadata?: Record<string, unknown>;
 }
 /**
  * Final, normalized scenario configuration.
@@ -265,6 +272,10 @@ type ScriptStep = (state: ScenarioExecutionStateLike, executor: ScenarioExecutio
  *
  */
 interface ScenarioResult {
+    /**
+     * Unique identifier for this scenario run.
+     */
+    runId: string;
     /**
      * Indicates whether the scenario was successful.
      */
@@ -357,6 +368,13 @@ interface ScenarioExecutionStateLike {
     hasToolCall(toolName: string): boolean;
 }
+/**
+ * Schema for the scenario project configuration file (scenario.config.js).
+ *
+ * The `observability` field accepts a subset of `SetupObservabilityOptions`
+ * from the langwatch SDK. It uses `z.custom()` to avoid strict validation
+ * on the passthrough object while keeping the outer config strict.
+ */
 declare const scenarioProjectConfigSchema: z.ZodObject<{
     defaultModel: z.ZodOptional<z.ZodObject<{
         model: z.ZodCustom<ai.LanguageModel, ai.LanguageModel>;
@@ -364,6 +382,7 @@ declare const scenarioProjectConfigSchema: z.ZodObject<{
         maxTokens: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>>;
     headless: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+    observability: z.ZodOptional<z.ZodCustom<Partial<SetupObservabilityOptions>, Partial<SetupObservabilityOptions>>>;
 }, z.core.$strict>;
 type ScenarioProjectConfig = z.infer<typeof scenarioProjectConfigSchema>;
 declare function defineConfig(config: ScenarioProjectConfig): ScenarioProjectConfig;
@@ -467,6 +486,13 @@ declare class JudgeSpanCollector implements SpanProcessor {
     onEnd(span: ReadableSpan): void;
     forceFlush(): Promise<void>;
     shutdown(): Promise<void>;
+    /**
+     * Removes all spans associated with a specific thread.
+     * Call this after a scenario run completes to prevent memory growth
+     * in long-lived processes.
+     * @param threadId - The thread identifier whose spans should be cleared
+     */
+    clearSpansForThread(threadId: string): void;
     /**
      * Retrieves all spans associated with a specific thread.
      * @param threadId - The thread identifier to filter spans by
@@ -914,35 +940,39 @@ declare const scenarioEventSchema: z$1.ZodDiscriminatedUnion<"type", [z$1.ZodObj
     metadata: z$1.ZodObject<{
         name: z$1.ZodOptional<z$1.ZodString>;
         description: z$1.ZodOptional<z$1.ZodString>;
-    }, "strip", z$1.ZodTypeAny, {
-        description?: string | undefined;
-        name?: string | undefined;
-    }, {
-        description?: string | undefined;
-        name?: string | undefined;
-    }>;
+    }, "strip", z$1.ZodUnknown, z$1.objectOutputType<{
+        name: z$1.ZodOptional<z$1.ZodString>;
+        description: z$1.ZodOptional<z$1.ZodString>;
+    }, z$1.ZodUnknown, "strip">, z$1.objectInputType<{
+        name: z$1.ZodOptional<z$1.ZodString>;
+        description: z$1.ZodOptional<z$1.ZodString>;
+    }, z$1.ZodUnknown, "strip">>;
 }, "strip", z$1.ZodTypeAny, {
     type: ScenarioEventType.RUN_STARTED;
+    metadata: {
+        name?: string | undefined;
+        description?: string | undefined;
+    } & {
+        [k: string]: unknown;
+    };
     timestamp: number;
     batchRunId: string;
     scenarioId: string;
     scenarioRunId: string;
     scenarioSetId: string;
-    metadata: {
-        description?: string | undefined;
-        name?: string | undefined;
-    };
     rawEvent?: any;
 }, {
     type: ScenarioEventType.RUN_STARTED;
+    metadata: {
+        name?: string | undefined;
+        description?: string | undefined;
+    } & {
+        [k: string]: unknown;
+    };
     timestamp: number;
     batchRunId: string;
     scenarioId: string;
     scenarioRunId: string;
-    metadata: {
-        description?: string | undefined;
-        name?: string | undefined;
-    };
     rawEvent?: any;
     scenarioSetId?: string | undefined;
 }>, z$1.ZodObject<{
@@ -1363,13 +1393,18 @@ declare class ScenarioExecution implements ScenarioExecutionLike {
      * - RUN_FINISHED: When scenario execution completes (success/failure/error)
      */
     readonly events$: Observable<ScenarioEvent>;
+    /** Batch run ID for grouping scenario runs */
+    private batchRunId;
+    /** The run ID for the current execution */
+    private scenarioRunId?;
     /**
      * Creates a new ScenarioExecution instance.
      *
      * @param config - The scenario configuration containing agents, settings, and metadata
      * @param script - The ordered sequence of script steps that define the test flow
+     * @param batchRunId - Batch run ID for grouping scenario runs
      */
-    constructor(config: ScenarioConfig, script: ScriptStep[]);
+    constructor(config: ScenarioConfig, script: ScriptStep[], batchRunId: string);
     /**
      * Gets the complete conversation history as an array of messages.
      *
@@ -1728,7 +1763,7 @@ declare class ScenarioExecution implements ScenarioExecutionLike {
      * - Creates a new ScenarioExecutionState with the current config
      * - Sets up the thread ID (generates new one if not provided)
      * - Initializes all agents
-     * - Starts the first turn
+     * - Initializes turn state (pending agents/roles) without creating a trace span
      * - Records the start time for performance tracking
      * - Clears any pending messages
      * - Clears the result from any previous execution
@@ -1907,6 +1942,25 @@ declare namespace execution {
   export { execution_ScenarioExecution as ScenarioExecution, execution_ScenarioExecutionState as ScenarioExecutionState, type execution_StateChangeEvent as StateChangeEvent, execution_StateChangeEventType as StateChangeEventType };
 }
+/**
+ * Configuration for LangWatch event reporting.
+ * All fields are optional — any omitted fields fall back to environment variables.
+ */
+interface LangwatchConfig {
+    /** The endpoint URL to send events to. Falls back to LANGWATCH_ENDPOINT env var. */
+    endpoint?: string;
+    /** The API key for authentication. Falls back to LANGWATCH_API_KEY env var. */
+    apiKey?: string;
+}
+/**
+ * Options for running a scenario.
+ */
+interface RunOptions {
+    /** LangWatch configuration for event reporting. Overrides environment variables. */
+    langwatch?: LangwatchConfig;
+    /** Batch run ID for grouping scenario runs. Overrides SCENARIO_BATCH_RUN_ID env var. */
+    batchRunId?: string;
+}
 /**
  * High-level interface for running a scenario test.
  *
@@ -1956,11 +2010,13 @@ declare namespace execution {
  * main();
  * ```
  */
-declare function run(cfg: ScenarioConfig): Promise<ScenarioResult>;
+declare function run(cfg: ScenarioConfig, options?: RunOptions): Promise<ScenarioResult>;
+type runner_LangwatchConfig = LangwatchConfig;
+type runner_RunOptions = RunOptions;
 declare const runner_run: typeof run;
 declare namespace runner {
-  export { runner_run as run };
+  export { type runner_LangwatchConfig as LangwatchConfig, type runner_RunOptions as RunOptions, runner_run as run };
 }
 /**
@@ -2068,7 +2124,107 @@ declare namespace script {
   export { script_agent as agent, script_fail as fail, script_judge as judge, script_message as message, script_proceed as proceed, script_succeed as succeed, script_user as user };
 }
+/**
+ * Explicitly set up tracing for @langwatch/scenario.
+ *
+ * Call this before any `run()` invocations when you want full control
+ * over the observability configuration. If called, `run()` will skip
+ * its own lazy initialization.
+ *
+ * The `judgeSpanCollector` is always added as a span processor regardless
+ * of the user-provided options.
+ *
+ * @param options - Optional `SetupObservabilityOptions` forwarded to the
+ *   langwatch SDK `setupObservability()` function.
+ *
+ * @example
+ * ```typescript
+ * import { setupScenarioTracing } from "@langwatch/scenario";
+ *
+ * setupScenarioTracing({
+ *   instrumentations: [],          // disable auto-instrumentation
+ *   spanProcessors: [myProcessor], // add custom processors
+ * });
+ * ```
+ */
+declare function setupScenarioTracing(options?: Partial<SetupObservabilityOptions>): void;
+/**
+ * Criteria for matching spans by instrumentation scope name or span name.
+ * Within each field, matchers use OR semantics (any match succeeds).
+ * Across fields, AND semantics apply (all specified fields must match).
+ */
+interface TraceFilterCriteria {
+    instrumentationScopeName?: TraceFilterMatch[];
+    name?: TraceFilterMatch[];
+}
+/**
+ * A single match rule for string comparison.
+ */
+interface TraceFilterMatch {
+    equals?: string;
+    startsWith?: string;
+    matches?: RegExp;
+    ignoreCase?: boolean;
+}
+/**
+ * A filter rule for controlling which spans are exported.
+ *
+ * Compatible with the langwatch SDK's `TraceFilter` type used by
+ * `LangWatchTraceExporter`.
+ */
+type TraceFilter = {
+    preset: "vercelAIOnly" | "excludeHttpRequests";
+} | {
+    include: TraceFilterCriteria;
+} | {
+    exclude: TraceFilterCriteria;
+};
+/**
+ * Preset filter that only keeps spans from the @langwatch/scenario instrumentation scope.
+ * Use this to prevent unrelated server spans (HTTP, middleware, etc.) from being exported.
+ *
+ * @example
+ * ```typescript
+ * import { defineConfig, scenarioOnly } from "@langwatch/scenario";
+ * import { LangWatchTraceExporter } from "langwatch/observability";
+ *
+ * export default defineConfig({
+ *   observability: {
+ *     traceExporter: new LangWatchTraceExporter({
+ *       filters: scenarioOnly,
+ *     }),
+ *     instrumentations: [], // disable auto-instrumentation
+ *   },
+ * });
+ * ```
+ */
+declare const scenarioOnly: TraceFilter[];
+/**
+ * Creates a filter that keeps spans from the @langwatch/scenario scope
+ * plus any additional custom instrumentation scopes.
+ *
+ * @param scopes - Additional instrumentation scope names to include
+ * @returns Array of TraceFilter rules
+ *
+ * @example
+ * ```typescript
+ * import { defineConfig, withCustomScopes } from "@langwatch/scenario";
+ * import { LangWatchTraceExporter } from "langwatch/observability";
+ *
+ * export default defineConfig({
+ *   observability: {
+ *     traceExporter: new LangWatchTraceExporter({
+ *       filters: withCustomScopes("my-app/database", "my-app/agent"),
+ *     }),
+ *     instrumentations: [], // disable auto-instrumentation
+ *   },
+ * });
+ * ```
+ */
+declare function withCustomScopes(...scopes: string[]): TraceFilter[];
 type ScenarioApi = typeof agents & typeof domain & typeof execution & typeof runner & typeof script;
 declare const scenario: ScenarioApi;
-export { AgentAdapter, type AgentInput, type AgentReturnTypes, AgentRole, type AudioResponseEvent, DEFAULT_MAX_TURNS, DEFAULT_VERBOSE, type FinishTestArgs, type InvokeLLMParams, type InvokeLLMResult, JudgeAgentAdapter, type JudgeAgentConfig, type JudgeResult, JudgeSpanCollector, JudgeSpanDigestFormatter, type JudgmentRequest, RealtimeAgentAdapter, type RealtimeAgentAdapterConfig, type ScenarioConfig, type ScenarioConfigFinal, ScenarioExecution, type ScenarioExecutionLike, ScenarioExecutionState, type ScenarioExecutionStateLike, type ScenarioProjectConfig, type ScenarioResult, type ScriptStep, type StateChangeEvent, StateChangeEventType, type TestingAgentConfig, UserSimulatorAgentAdapter, agent, allAgentRoles, scenario as default, defineConfig, fail, judge, judgeAgent, judgeSpanCollector, judgeSpanDigestFormatter, message, proceed, run, scenario, scenarioProjectConfigSchema, succeed, user, userSimulatorAgent };
+export { AgentAdapter, type AgentInput, type AgentReturnTypes, AgentRole, type AudioResponseEvent, DEFAULT_MAX_TURNS, DEFAULT_VERBOSE, type FinishTestArgs, type InvokeLLMParams, type InvokeLLMResult, JudgeAgentAdapter, type JudgeAgentConfig, type JudgeResult, JudgeSpanCollector, JudgeSpanDigestFormatter, type JudgmentRequest, type LangwatchConfig, RealtimeAgentAdapter, type RealtimeAgentAdapterConfig, type RunOptions, type ScenarioConfig, type ScenarioConfigFinal, ScenarioExecution, type ScenarioExecutionLike, ScenarioExecutionState, type ScenarioExecutionStateLike, type ScenarioProjectConfig, type ScenarioResult, type ScriptStep, type StateChangeEvent, StateChangeEventType, type TestingAgentConfig, UserSimulatorAgentAdapter, agent, allAgentRoles, scenario as default, defineConfig, fail, judge, judgeAgent, judgeSpanCollector, judgeSpanDigestFormatter, message, proceed, run, scenario, scenarioOnly, scenarioProjectConfigSchema, setupScenarioTracing, succeed, user, userSimulatorAgent, withCustomScopes };

package/dist/index.d.ts (changed)

@@ -3,6 +3,7 @@ import { ModelMessage, UserModelMessage, AssistantModelMessage, ToolModelMessage
 import { z } from 'zod/v4';
 import { SpanProcessor, ReadableSpan } from '@opentelemetry/sdk-trace-base';
 import { RealtimeSession } from '@openai/agents/realtime';
+import { SetupObservabilityOptions } from 'langwatch/observability/node';
 import { Observable } from 'rxjs';
 import { z as z$1 } from 'zod';
@@ -178,6 +179,12 @@ interface ScenarioConfig {
      * If not provided, the scenario will not be grouped into a set.
      */
     setId?: string;
+    /**
+     * Optional metadata to attach to the scenario run.
+     * Accepts arbitrary key-value pairs (e.g. prompt IDs, environments, versions).
+     * The `langwatch` key is reserved for platform-internal use.
+     */
+    metadata?: Record<string, unknown>;
 }
 /**
  * Final, normalized scenario configuration.
@@ -265,6 +272,10 @@ type ScriptStep = (state: ScenarioExecutionStateLike, executor: ScenarioExecutio
  *
  */
 interface ScenarioResult {
+    /**
+     * Unique identifier for this scenario run.
+     */
+    runId: string;
     /**
      * Indicates whether the scenario was successful.
      */
@@ -357,6 +368,13 @@ interface ScenarioExecutionStateLike {
     hasToolCall(toolName: string): boolean;
 }
+/**
+ * Schema for the scenario project configuration file (scenario.config.js).
+ *
+ * The `observability` field accepts a subset of `SetupObservabilityOptions`
+ * from the langwatch SDK. It uses `z.custom()` to avoid strict validation
+ * on the passthrough object while keeping the outer config strict.
+ */
 declare const scenarioProjectConfigSchema: z.ZodObject<{
     defaultModel: z.ZodOptional<z.ZodObject<{
         model: z.ZodCustom<ai.LanguageModel, ai.LanguageModel>;
@@ -364,6 +382,7 @@ declare const scenarioProjectConfigSchema: z.ZodObject<{
         maxTokens: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>>;
     headless: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+    observability: z.ZodOptional<z.ZodCustom<Partial<SetupObservabilityOptions>, Partial<SetupObservabilityOptions>>>;
 }, z.core.$strict>;
 type ScenarioProjectConfig = z.infer<typeof scenarioProjectConfigSchema>;
 declare function defineConfig(config: ScenarioProjectConfig): ScenarioProjectConfig;
@@ -467,6 +486,13 @@ declare class JudgeSpanCollector implements SpanProcessor {
     onEnd(span: ReadableSpan): void;
     forceFlush(): Promise<void>;
     shutdown(): Promise<void>;
+    /**
+     * Removes all spans associated with a specific thread.
+     * Call this after a scenario run completes to prevent memory growth
+     * in long-lived processes.
+     * @param threadId - The thread identifier whose spans should be cleared
+     */
+    clearSpansForThread(threadId: string): void;
     /**
      * Retrieves all spans associated with a specific thread.
      * @param threadId - The thread identifier to filter spans by
@@ -914,35 +940,39 @@ declare const scenarioEventSchema: z$1.ZodDiscriminatedUnion<"type", [z$1.ZodObj
     metadata: z$1.ZodObject<{
         name: z$1.ZodOptional<z$1.ZodString>;
         description: z$1.ZodOptional<z$1.ZodString>;
-    }, "strip", z$1.ZodTypeAny, {
-        description?: string | undefined;
-        name?: string | undefined;
-    }, {
-        description?: string | undefined;
-        name?: string | undefined;
-    }>;
+    }, "strip", z$1.ZodUnknown, z$1.objectOutputType<{
+        name: z$1.ZodOptional<z$1.ZodString>;
+        description: z$1.ZodOptional<z$1.ZodString>;
+    }, z$1.ZodUnknown, "strip">, z$1.objectInputType<{
+        name: z$1.ZodOptional<z$1.ZodString>;
+        description: z$1.ZodOptional<z$1.ZodString>;
+    }, z$1.ZodUnknown, "strip">>;
 }, "strip", z$1.ZodTypeAny, {
     type: ScenarioEventType.RUN_STARTED;
+    metadata: {
+        name?: string | undefined;
+        description?: string | undefined;
+    } & {
+        [k: string]: unknown;
+    };
     timestamp: number;
     batchRunId: string;
     scenarioId: string;
     scenarioRunId: string;
     scenarioSetId: string;
-    metadata: {
-        description?: string | undefined;
-        name?: string | undefined;
-    };
     rawEvent?: any;
 }, {
     type: ScenarioEventType.RUN_STARTED;
+    metadata: {
+        name?: string | undefined;
+        description?: string | undefined;
+    } & {
+        [k: string]: unknown;
+    };
     timestamp: number;
     batchRunId: string;
     scenarioId: string;
     scenarioRunId: string;
-    metadata: {
-        description?: string | undefined;
-        name?: string | undefined;
-    };
     rawEvent?: any;
     scenarioSetId?: string | undefined;
 }>, z$1.ZodObject<{
@@ -1363,13 +1393,18 @@ declare class ScenarioExecution implements ScenarioExecutionLike {
      * - RUN_FINISHED: When scenario execution completes (success/failure/error)
      */
     readonly events$: Observable<ScenarioEvent>;
+    /** Batch run ID for grouping scenario runs */
+    private batchRunId;
+    /** The run ID for the current execution */
+    private scenarioRunId?;
     /**
      * Creates a new ScenarioExecution instance.
      *
      * @param config - The scenario configuration containing agents, settings, and metadata
      * @param script - The ordered sequence of script steps that define the test flow
+     * @param batchRunId - Batch run ID for grouping scenario runs
      */
-    constructor(config: ScenarioConfig, script: ScriptStep[]);
+    constructor(config: ScenarioConfig, script: ScriptStep[], batchRunId: string);
     /**
      * Gets the complete conversation history as an array of messages.
      *
@@ -1728,7 +1763,7 @@ declare class ScenarioExecution implements ScenarioExecutionLike {
      * - Creates a new ScenarioExecutionState with the current config
      * - Sets up the thread ID (generates new one if not provided)
      * - Initializes all agents
-     * - Starts the first turn
+     * - Initializes turn state (pending agents/roles) without creating a trace span
      * - Records the start time for performance tracking
      * - Clears any pending messages
      * - Clears the result from any previous execution
@@ -1907,6 +1942,25 @@ declare namespace execution {
   export { execution_ScenarioExecution as ScenarioExecution, execution_ScenarioExecutionState as ScenarioExecutionState, type execution_StateChangeEvent as StateChangeEvent, execution_StateChangeEventType as StateChangeEventType };
 }
+/**
+ * Configuration for LangWatch event reporting.
+ * All fields are optional — any omitted fields fall back to environment variables.
+ */
+interface LangwatchConfig {
+    /** The endpoint URL to send events to. Falls back to LANGWATCH_ENDPOINT env var. */
+    endpoint?: string;
+    /** The API key for authentication. Falls back to LANGWATCH_API_KEY env var. */
+    apiKey?: string;
+}
+/**
+ * Options for running a scenario.
+ */
+interface RunOptions {
+    /** LangWatch configuration for event reporting. Overrides environment variables. */
+    langwatch?: LangwatchConfig;
+    /** Batch run ID for grouping scenario runs. Overrides SCENARIO_BATCH_RUN_ID env var. */
+    batchRunId?: string;
+}
 /**
  * High-level interface for running a scenario test.
  *
@@ -1956,11 +2010,13 @@ declare namespace execution {
  * main();
  * ```
  */
-declare function run(cfg: ScenarioConfig): Promise<ScenarioResult>;
+declare function run(cfg: ScenarioConfig, options?: RunOptions): Promise<ScenarioResult>;
+type runner_LangwatchConfig = LangwatchConfig;
+type runner_RunOptions = RunOptions;
 declare const runner_run: typeof run;
 declare namespace runner {
-  export { runner_run as run };
+  export { type runner_LangwatchConfig as LangwatchConfig, type runner_RunOptions as RunOptions, runner_run as run };
 }
 /**
@@ -2068,7 +2124,107 @@ declare namespace script {
   export { script_agent as agent, script_fail as fail, script_judge as judge, script_message as message, script_proceed as proceed, script_succeed as succeed, script_user as user };
 }
+/**
+ * Explicitly set up tracing for @langwatch/scenario.
+ *
+ * Call this before any `run()` invocations when you want full control
+ * over the observability configuration. If called, `run()` will skip
+ * its own lazy initialization.
+ *
+ * The `judgeSpanCollector` is always added as a span processor regardless
+ * of the user-provided options.
+ *
+ * @param options - Optional `SetupObservabilityOptions` forwarded to the
+ *   langwatch SDK `setupObservability()` function.
+ *
+ * @example
+ * ```typescript
+ * import { setupScenarioTracing } from "@langwatch/scenario";
+ *
+ * setupScenarioTracing({
+ *   instrumentations: [],          // disable auto-instrumentation
+ *   spanProcessors: [myProcessor], // add custom processors
+ * });
+ * ```
+ */
+declare function setupScenarioTracing(options?: Partial<SetupObservabilityOptions>): void;
+/**
+ * Criteria for matching spans by instrumentation scope name or span name.
+ * Within each field, matchers use OR semantics (any match succeeds).
+ * Across fields, AND semantics apply (all specified fields must match).
+ */
+interface TraceFilterCriteria {
+    instrumentationScopeName?: TraceFilterMatch[];
+    name?: TraceFilterMatch[];
+}
+/**
+ * A single match rule for string comparison.
+ */
+interface TraceFilterMatch {
+    equals?: string;
+    startsWith?: string;
+    matches?: RegExp;
+    ignoreCase?: boolean;
+}
+/**
+ * A filter rule for controlling which spans are exported.
+ *
+ * Compatible with the langwatch SDK's `TraceFilter` type used by
+ * `LangWatchTraceExporter`.
+ */
+type TraceFilter = {
+    preset: "vercelAIOnly" | "excludeHttpRequests";
+} | {
+    include: TraceFilterCriteria;
+} | {
+    exclude: TraceFilterCriteria;
+};
+/**
+ * Preset filter that only keeps spans from the @langwatch/scenario instrumentation scope.
+ * Use this to prevent unrelated server spans (HTTP, middleware, etc.) from being exported.
+ *
+ * @example
+ * ```typescript
+ * import { defineConfig, scenarioOnly } from "@langwatch/scenario";
+ * import { LangWatchTraceExporter } from "langwatch/observability";
+ *
+ * export default defineConfig({
+ *   observability: {
+ *     traceExporter: new LangWatchTraceExporter({
+ *       filters: scenarioOnly,
+ *     }),
+ *     instrumentations: [], // disable auto-instrumentation
+ *   },
+ * });
+ * ```
+ */
+declare const scenarioOnly: TraceFilter[];
+/**
+ * Creates a filter that keeps spans from the @langwatch/scenario scope
+ * plus any additional custom instrumentation scopes.
+ *
+ * @param scopes - Additional instrumentation scope names to include
+ * @returns Array of TraceFilter rules
+ *
+ * @example
+ * ```typescript
+ * import { defineConfig, withCustomScopes } from "@langwatch/scenario";
+ * import { LangWatchTraceExporter } from "langwatch/observability";
+ *
+ * export default defineConfig({
+ *   observability: {
+ *     traceExporter: new LangWatchTraceExporter({
+ *       filters: withCustomScopes("my-app/database", "my-app/agent"),
+ *     }),
+ *     instrumentations: [], // disable auto-instrumentation
+ *   },
+ * });
+ * ```
+ */
+declare function withCustomScopes(...scopes: string[]): TraceFilter[];
 type ScenarioApi = typeof agents & typeof domain & typeof execution & typeof runner & typeof script;
 declare const scenario: ScenarioApi;
-export { AgentAdapter, type AgentInput, type AgentReturnTypes, AgentRole, type AudioResponseEvent, DEFAULT_MAX_TURNS, DEFAULT_VERBOSE, type FinishTestArgs, type InvokeLLMParams, type InvokeLLMResult, JudgeAgentAdapter, type JudgeAgentConfig, type JudgeResult, JudgeSpanCollector, JudgeSpanDigestFormatter, type JudgmentRequest, RealtimeAgentAdapter, type RealtimeAgentAdapterConfig, type ScenarioConfig, type ScenarioConfigFinal, ScenarioExecution, type ScenarioExecutionLike, ScenarioExecutionState, type ScenarioExecutionStateLike, type ScenarioProjectConfig, type ScenarioResult, type ScriptStep, type StateChangeEvent, StateChangeEventType, type TestingAgentConfig, UserSimulatorAgentAdapter, agent, allAgentRoles, scenario as default, defineConfig, fail, judge, judgeAgent, judgeSpanCollector, judgeSpanDigestFormatter, message, proceed, run, scenario, scenarioProjectConfigSchema, succeed, user, userSimulatorAgent };
+export { AgentAdapter, type AgentInput, type AgentReturnTypes, AgentRole, type AudioResponseEvent, DEFAULT_MAX_TURNS, DEFAULT_VERBOSE, type FinishTestArgs, type InvokeLLMParams, type InvokeLLMResult, JudgeAgentAdapter, type JudgeAgentConfig, type JudgeResult, JudgeSpanCollector, JudgeSpanDigestFormatter, type JudgmentRequest, type LangwatchConfig, RealtimeAgentAdapter, type RealtimeAgentAdapterConfig, type RunOptions, type ScenarioConfig, type ScenarioConfigFinal, ScenarioExecution, type ScenarioExecutionLike, ScenarioExecutionState, type ScenarioExecutionStateLike, type ScenarioProjectConfig, type ScenarioResult, type ScriptStep, type StateChangeEvent, StateChangeEventType, type TestingAgentConfig, UserSimulatorAgentAdapter, agent, allAgentRoles, scenario as default, defineConfig, fail, judge, judgeAgent, judgeSpanCollector, judgeSpanDigestFormatter, message, proceed, run, scenario, scenarioOnly, scenarioProjectConfigSchema, setupScenarioTracing, succeed, user, userSimulatorAgent, withCustomScopes };