npm - @livekit/agents - Versions diffs - 1.0.34 → 1.0.36 - Mend

@livekit/agents 1.0.34 → 1.0.36

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (117) hide show

package/dist/cli.cjs.map +1 -1
package/dist/inference/api_protos.d.cts +4 -4
package/dist/inference/api_protos.d.ts +4 -4
package/dist/inference/llm.cjs +30 -3
package/dist/inference/llm.cjs.map +1 -1
package/dist/inference/llm.d.cts +3 -1
package/dist/inference/llm.d.ts +3 -1
package/dist/inference/llm.d.ts.map +1 -1
package/dist/inference/llm.js +30 -3
package/dist/inference/llm.js.map +1 -1
package/dist/ipc/inference_proc_executor.cjs.map +1 -1
package/dist/ipc/job_proc_executor.cjs.map +1 -1
package/dist/ipc/job_proc_lazy_main.cjs +1 -1
package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
package/dist/ipc/job_proc_lazy_main.js +1 -1
package/dist/ipc/job_proc_lazy_main.js.map +1 -1
package/dist/llm/chat_context.cjs +20 -2
package/dist/llm/chat_context.cjs.map +1 -1
package/dist/llm/chat_context.d.cts +9 -0
package/dist/llm/chat_context.d.ts +9 -0
package/dist/llm/chat_context.d.ts.map +1 -1
package/dist/llm/chat_context.js +20 -2
package/dist/llm/chat_context.js.map +1 -1
package/dist/llm/llm.cjs.map +1 -1
package/dist/llm/llm.d.cts +1 -0
package/dist/llm/llm.d.ts +1 -0
package/dist/llm/llm.d.ts.map +1 -1
package/dist/llm/llm.js.map +1 -1
package/dist/llm/provider_format/openai.cjs +43 -20
package/dist/llm/provider_format/openai.cjs.map +1 -1
package/dist/llm/provider_format/openai.d.ts.map +1 -1
package/dist/llm/provider_format/openai.js +43 -20
package/dist/llm/provider_format/openai.js.map +1 -1
package/dist/llm/provider_format/openai.test.cjs +35 -0
package/dist/llm/provider_format/openai.test.cjs.map +1 -1
package/dist/llm/provider_format/openai.test.js +35 -0
package/dist/llm/provider_format/openai.test.js.map +1 -1
package/dist/llm/provider_format/utils.cjs +1 -1
package/dist/llm/provider_format/utils.cjs.map +1 -1
package/dist/llm/provider_format/utils.d.ts.map +1 -1
package/dist/llm/provider_format/utils.js +1 -1
package/dist/llm/provider_format/utils.js.map +1 -1
package/dist/voice/agent_activity.cjs +19 -19
package/dist/voice/agent_activity.cjs.map +1 -1
package/dist/voice/agent_activity.d.ts.map +1 -1
package/dist/voice/agent_activity.js +19 -19
package/dist/voice/agent_activity.js.map +1 -1
package/dist/voice/agent_session.cjs +64 -25
package/dist/voice/agent_session.cjs.map +1 -1
package/dist/voice/agent_session.d.cts +25 -1
package/dist/voice/agent_session.d.ts +25 -1
package/dist/voice/agent_session.d.ts.map +1 -1
package/dist/voice/agent_session.js +64 -25
package/dist/voice/agent_session.js.map +1 -1
package/dist/voice/background_audio.cjs.map +1 -1
package/dist/voice/generation.cjs +2 -1
package/dist/voice/generation.cjs.map +1 -1
package/dist/voice/generation.d.ts.map +1 -1
package/dist/voice/generation.js +2 -1
package/dist/voice/generation.js.map +1 -1
package/dist/voice/index.cjs +14 -1
package/dist/voice/index.cjs.map +1 -1
package/dist/voice/index.d.cts +1 -0
package/dist/voice/index.d.ts +1 -0
package/dist/voice/index.d.ts.map +1 -1
package/dist/voice/index.js +3 -1
package/dist/voice/index.js.map +1 -1
package/dist/voice/room_io/room_io.cjs +1 -0
package/dist/voice/room_io/room_io.cjs.map +1 -1
package/dist/voice/room_io/room_io.d.ts.map +1 -1
package/dist/voice/room_io/room_io.js +1 -0
package/dist/voice/room_io/room_io.js.map +1 -1
package/dist/voice/speech_handle.cjs +12 -3
package/dist/voice/speech_handle.cjs.map +1 -1
package/dist/voice/speech_handle.d.cts +12 -2
package/dist/voice/speech_handle.d.ts +12 -2
package/dist/voice/speech_handle.d.ts.map +1 -1
package/dist/voice/speech_handle.js +10 -2
package/dist/voice/speech_handle.js.map +1 -1
package/dist/voice/testing/index.cjs +52 -0
package/dist/voice/testing/index.cjs.map +1 -0
package/dist/voice/testing/index.d.cts +20 -0
package/dist/voice/testing/index.d.ts +20 -0
package/dist/voice/testing/index.d.ts.map +1 -0
package/dist/voice/testing/index.js +31 -0
package/dist/voice/testing/index.js.map +1 -0
package/dist/voice/testing/run_result.cjs +477 -0
package/dist/voice/testing/run_result.cjs.map +1 -0
package/dist/voice/testing/run_result.d.cts +226 -0
package/dist/voice/testing/run_result.d.ts +226 -0
package/dist/voice/testing/run_result.d.ts.map +1 -0
package/dist/voice/testing/run_result.js +451 -0
package/dist/voice/testing/run_result.js.map +1 -0
package/dist/voice/testing/types.cjs +46 -0
package/dist/voice/testing/types.cjs.map +1 -0
package/dist/voice/testing/types.d.cts +83 -0
package/dist/voice/testing/types.d.ts +83 -0
package/dist/voice/testing/types.d.ts.map +1 -0
package/dist/voice/testing/types.js +19 -0
package/dist/voice/testing/types.js.map +1 -0
package/package.json +3 -3
package/src/inference/llm.ts +42 -3
package/src/ipc/job_proc_lazy_main.ts +1 -1
package/src/llm/chat_context.ts +32 -2
package/src/llm/llm.ts +1 -0
package/src/llm/provider_format/openai.test.ts +40 -0
package/src/llm/provider_format/openai.ts +46 -19
package/src/llm/provider_format/utils.ts +5 -1
package/src/voice/agent_activity.ts +24 -22
package/src/voice/agent_session.ts +73 -28
package/src/voice/generation.ts +1 -0
package/src/voice/index.ts +1 -0
package/src/voice/room_io/room_io.ts +1 -0
package/src/voice/speech_handle.ts +24 -4
package/src/voice/testing/index.ts +49 -0
package/src/voice/testing/run_result.ts +576 -0
package/src/voice/testing/types.ts +118 -0

package/src/voice/agent_session.ts CHANGED Viewed

@@ -61,6 +61,7 @@ import { RecorderIO } from './recorder_io/index.js';
 import { RoomIO, type RoomInputOptions, type RoomOutputOptions } from './room_io/index.js';
 import type { UnknownUserData } from './run_context.js';
 import type { SpeechHandle } from './speech_handle.js';
+import { RunResult } from './testing/run_result.js';
 export interface VoiceOptions {
   allowInterruptions: boolean;
@@ -167,6 +168,9 @@ export class AgentSession<
   /** @internal - Timestamp when the session started (milliseconds) */
   _startedAt?: number;
+  /** @internal - Current run state for testing */
+  _globalRunState?: RunResult;
   constructor(opts: AgentSessionOptions<UserData>) {
     super();
@@ -272,7 +276,7 @@ export class AgentSession<
     span,
   }: {
     agent: Agent;
-    room: Room;
+    room?: Room;
     inputOptions?: Partial<RoomInputOptions>;
     outputOptions?: Partial<RoomOutputOptions>;
     span: Span;
@@ -283,41 +287,45 @@ export class AgentSession<
     this._updateAgentState('initializing');
     const tasks: Promise<void>[] = [];
-    // Check for existing input/output configuration and warn if needed
-    if (this.input.audio && inputOptions?.audioEnabled !== false) {
-      this.logger.warn('RoomIO audio input is enabled but input.audio is already set, ignoring..');
-    }
-    if (this.output.audio && outputOptions?.audioEnabled !== false) {
-      this.logger.warn(
-        'RoomIO audio output is enabled but output.audio is already set, ignoring..',
-      );
-    }
+    if (room && !this.roomIO) {
+      // Check for existing input/output configuration and warn if needed
+      if (this.input.audio && inputOptions?.audioEnabled !== false) {
+        this.logger.warn(
+          'RoomIO audio input is enabled but input.audio is already set, ignoring..',
+        );
+      }
-    if (this.output.transcription && outputOptions?.transcriptionEnabled !== false) {
-      this.logger.warn(
-        'RoomIO transcription output is enabled but output.transcription is already set, ignoring..',
-      );
-    }
+      if (this.output.audio && outputOptions?.audioEnabled !== false) {
+        this.logger.warn(
+          'RoomIO audio output is enabled but output.audio is already set, ignoring..',
+        );
+      }
-    this.roomIO = new RoomIO({
-      agentSession: this,
-      room,
-      inputOptions,
-      outputOptions,
-    });
-    this.roomIO.start();
+      if (this.output.transcription && outputOptions?.transcriptionEnabled !== false) {
+        this.logger.warn(
+          'RoomIO transcription output is enabled but output.transcription is already set, ignoring..',
+        );
+      }
+      this.roomIO = new RoomIO({
+        agentSession: this,
+        room,
+        inputOptions,
+        outputOptions,
+      });
+      this.roomIO.start();
+    }
     let ctx: JobContext | undefined = undefined;
     try {
       ctx = getJobContext();
-    } catch (error) {
+    } catch {
       // JobContext is not available in evals
-      this.logger.warn('JobContext is not available');
     }
     if (ctx) {
-      if (ctx.room === room && !room.isConnected) {
+      if (room && ctx.room === room && !room.isConnected) {
         this.logger.debug('Auto-connecting to room via job context');
         tasks.push(ctx.connect());
       }
@@ -370,7 +378,7 @@ export class AgentSession<
     record,
   }: {
     agent: Agent;
-    room: Room;
+    room?: Room;
     inputOptions?: Partial<RoomInputOptions>;
     outputOptions?: Partial<RoomOutputOptions>;
     record?: boolean;
@@ -497,13 +505,50 @@ export class AgentSession<
     // attach to the session span if called outside of the AgentSession
     const activeSpan = trace.getActiveSpan();
+    let handle: SpeechHandle;
     if (!activeSpan && this.rootSpanContext) {
-      return otelContext.with(this.rootSpanContext, () =>
+      handle = otelContext.with(this.rootSpanContext, () =>
         doGenerateReply(this.activity!, this.nextActivity),
       );
+    } else {
+      handle = doGenerateReply(this.activity!, this.nextActivity);
     }
-    return doGenerateReply(this.activity!, this.nextActivity);
+    if (this._globalRunState) {
+      this._globalRunState._watchHandle(handle);
+    }
+    return handle;
+  }
+  /**
+   * Run a test with user input and return a result for assertions.
+   *
+   * This method is primarily used for testing agent behavior without
+   * requiring a real room connection.
+   *
+   * @example
+   * ```typescript
+   * const result = await session.run({ userInput: 'Hello' });
+   * result.expect.nextEvent().isMessage({ role: 'assistant' });
+   * result.expect.noMoreEvents();
+   * ```
+   *
+   * @param options - Run options including user input
+   * @returns A RunResult that resolves when the agent finishes responding
+   *
+   * TODO: Add outputType parameter for typed outputs (parity with Python)
+   */
+  run(options: { userInput: string }): RunResult {
+    if (this._globalRunState && !this._globalRunState.done()) {
+      throw new Error('nested runs are not supported');
+    }
+    const runState = new RunResult({ userInput: options.userInput });
+    this._globalRunState = runState;
+    this.generateReply({ userInput: options.userInput });
+    return runState;
   }
   private async updateActivity(agent: Agent): Promise<void> {

package/src/voice/generation.ts CHANGED Viewed

@@ -444,6 +444,7 @@ export function performLLMInference(
                 args: tool.args,
                 // Preserve thought signature for Gemini 3+ thinking mode
                 thoughtSignature: tool.thoughtSignature,
+                extra: tool.extra || {},
               });
               data.generatedToolCalls.push(toolCall);

package/src/voice/index.ts CHANGED Viewed

@@ -10,3 +10,4 @@ export { type TimedString } from './io.js';
 export * from './report.js';
 export * from './room_io/index.js';
 export { RunContext } from './run_context.js';
+export * as testing from './testing/index.js';

package/src/voice/room_io/room_io.ts CHANGED Viewed

@@ -51,6 +51,7 @@ const DEFAULT_TEXT_INPUT_CALLBACK: TextInputCallback = (sess: AgentSession, ev:
 };
 const DEFAULT_PARTICIPANT_KINDS: ParticipantKind[] = [
+  ParticipantKind.CONNECTOR,
   ParticipantKind.SIP,
   ParticipantKind.STANDARD,
 ];

package/src/voice/speech_handle.ts CHANGED Viewed

@@ -2,10 +2,25 @@
 //
 // SPDX-License-Identifier: Apache-2.0
 import type { ChatItem } from '../llm/index.js';
-import { Event, Future, shortuuid } from '../utils.js';
 import type { Task } from '../utils.js';
+import { Event, Future, shortuuid } from '../utils.js';
 import { asyncLocalStorage } from './agent.js';
+/** Symbol used to identify SpeechHandle instances */
+const SPEECH_HANDLE_SYMBOL = Symbol.for('livekit.agents.SpeechHandle');
+/**
+ * Type guard to check if a value is a SpeechHandle.
+ *
+ * The check is structural rather than `instanceof`-based: it returns `true`
+ * only when `value` is a non-null object that exposes the
+ * `SPEECH_HANDLE_SYMBOL` key (found via the `in` operator, so inherited
+ * properties count) and the value stored under that key is strictly `true`.
+ * Primitives, `null`, `undefined`, and objects without the marker all yield
+ * `false`.
+ *
+ * NOTE(review): the marker is created with `Symbol.for`, i.e. it lives in the
+ * global symbol registry; presumably this is so handles are still recognized
+ * when more than one copy of the package is loaded - confirm with the authors.
+ *
+ * @param value - Any value to test.
+ * @returns `true` if `value` carries the SpeechHandle marker, narrowing its
+ * type to `SpeechHandle`; otherwise `false`.
+ */
+export function isSpeechHandle(value: unknown): value is SpeechHandle {
+  return (
+    typeof value === 'object' &&
+    value !== null &&
+    SPEECH_HANDLE_SYMBOL in value &&
+    (value as Record<symbol, boolean>)[SPEECH_HANDLE_SYMBOL] === true
+  );
+}
 export class SpeechHandle {
   /** Priority for messages that should be played after all other messages in the queue */
   static SPEECH_PRIORITY_LOW = 0;
@@ -18,16 +33,21 @@ export class SpeechHandle {
   private authorizedEvent = new Event();
   private scheduledFut = new Future<void>();
   private doneFut = new Future<void>();
   private generations: Future<void>[] = [];
+  private _chatItems: ChatItem[] = [];
   /** @internal */
   _tasks: Task<void>[] = [];
-  private _chatItems: ChatItem[] = [];
-  private _numSteps = 1;
+  /** @internal */
+  _numSteps = 1;
   private itemAddedCallbacks: Set<(item: ChatItem) => void> = new Set();
   private doneCallbacks: Set<(sh: SpeechHandle) => void> = new Set();
+  /** @internal Symbol marker for type identification */
+  readonly [SPEECH_HANDLE_SYMBOL] = true;
   constructor(
     private _id: string,
     private _allowInterruptions: boolean,

package/src/voice/testing/index.ts ADDED Viewed

@@ -0,0 +1,49 @@
+// SPDX-FileCopyrightText: 2025 LiveKit, Inc.
+//
+// SPDX-License-Identifier: Apache-2.0
+/**
+ * Testing utilities for agent evaluation.
+ *
+ * @example
+ * ```typescript
+ * import { AgentSession, Agent, voice } from '@livekit/agents';
+ *
+ * const session = new AgentSession({ llm });
+ * await session.start({ agent });
+ *
+ * const result = await session.run({ userInput: 'Hello' });
+ * result.expect.nextEvent().isMessage({ role: 'assistant' });
+ * result.expect.noMoreEvents();
+ * ```
+ *
+ * @packageDocumentation
+ */
+export {
+  AgentHandoffAssert,
+  AssertionError,
+  EventAssert,
+  FunctionCallAssert,
+  FunctionCallOutputAssert,
+  MessageAssert,
+  RunAssert,
+  RunResult,
+} from './run_result.js';
+export {
+  isAgentHandoffEvent,
+  isChatMessageEvent,
+  isFunctionCallEvent,
+  isFunctionCallOutputEvent,
+  type AgentHandoffAssertOptions,
+  type AgentHandoffEvent,
+  type ChatMessageEvent,
+  type EventType,
+  type FunctionCallAssertOptions,
+  type FunctionCallEvent,
+  type FunctionCallOutputAssertOptions,
+  type FunctionCallOutputEvent,
+  type MessageAssertOptions,
+  type RunEvent,
+} from './types.js';