npm - @dtelecom/agents-js - Versions diffs - 0.2.2 → 0.3.1 - Mend

@dtelecom/agents-js 0.2.2 → 0.3.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (17)

package/dist/index.d.mts +4 -2
package/dist/index.d.ts +4 -2
package/dist/index.js +44 -15
package/dist/index.js.map +1 -1
package/dist/index.mjs +44 -15
package/dist/index.mjs.map +1 -1
package/dist/memory/index.d.mts +1 -1
package/dist/memory/index.d.ts +1 -1
package/dist/providers/index.d.mts +1 -1
package/dist/providers/index.d.ts +1 -1
package/dist/providers/index.js +42 -0
package/dist/providers/index.js.map +1 -1
package/dist/providers/index.mjs +42 -0
package/dist/providers/index.mjs.map +1 -1
package/dist/{types-BBKtiPvm.d.mts → types-BJylZd8Q.d.mts} +28 -5
package/dist/{types-BBKtiPvm.d.ts → types-BJylZd8Q.d.ts} +28 -5
package/package.json +1 -1

package/dist/{types-BBKtiPvm.d.mts → types-BJylZd8Q.d.mts} RENAMED Viewed

@@ -85,6 +85,9 @@ declare class AudioOutput {
     private _responding;
     private _stopped;
     private silenceInterval;
+    /** Resolves when the RTP transport is ready and initial silence has been sent. */
+    readonly whenReady: Promise<void>;
+    private _resolveReady?;
     /** When set, raw PCM from TTS is saved to this directory as WAV files for debugging. */
     dumpDir: string | null;
     private dumpCounter;
@@ -164,6 +167,19 @@ interface Message {
     role: 'system' | 'user' | 'assistant';
     content: string;
 }
+interface ToolDefinition {
+    type: 'function';
+    function: {
+        name: string;
+        description: string;
+        parameters: Record<string, unknown>;
+    };
+}
+interface ToolCallResult {
+    id: string;
+    name: string;
+    arguments: string;
+}
 interface LLMChunk {
     type: 'token' | 'segment' | 'tool_call' | 'done';
     token?: string;
@@ -171,10 +187,7 @@ interface LLMChunk {
         lang: string;
         text: string;
     };
-    toolCall?: {
-        name: string;
-        arguments: string;
-    };
+    toolCall?: ToolCallResult;
     usage?: {
         promptTokens: number;
         completionTokens: number;
@@ -183,6 +196,8 @@ interface LLMChunk {
 interface LLMChatOptions {
     /** Skip structured output (responseFormat) for this call — return plain text tokens. */
     plainText?: boolean;
+    /** Tool definitions to pass to the LLM for function calling. */
+    tools?: ToolDefinition[];
 }
 interface LLMPlugin {
     chat(messages: Message[], signal?: AbortSignal, options?: LLMChatOptions): AsyncGenerator<LLMChunk>;
@@ -226,6 +241,8 @@ interface AgentConfig {
     memory?: MemoryConfig;
     /** Max context tokens before triggering summarization (default: 5000) */
     maxContextTokens?: number;
+    /** Tool definitions for LLM function calling. */
+    tools?: ToolDefinition[];
 }
 interface AgentStartOptions {
     room: string;
@@ -260,6 +277,8 @@ interface PipelineOptions {
     memory?: RoomMemory;
     /** Max context tokens before triggering summarization (default: 5000) */
     maxContextTokens?: number;
+    /** Tool definitions for LLM function calling. */
+    tools?: ToolDefinition[];
 }
 type AgentState = 'idle' | 'listening' | 'thinking' | 'speaking';
 interface AgentEvents {
@@ -272,6 +291,8 @@ interface AgentEvents {
     response: (text: string) => void;
     /** Agent state: idle → listening (STT active) → thinking (LLM) → speaking (audio) → idle. */
     agentState: (state: AgentState) => void;
+    /** Emitted when the LLM invokes a tool. */
+    toolCall: (toolCall: ToolCallResult) => void;
     error: (error: Error) => void;
     connected: () => void;
     disconnected: (reason?: string) => void;
@@ -283,7 +304,9 @@ interface PipelineEvents {
     sentence: (text: string) => void;
     response: (text: string) => void;
     agentState: (state: AgentState) => void;
+    /** Emitted when the LLM invokes a tool. */
+    toolCall: (toolCall: ToolCallResult) => void;
     error: (error: Error) => void;
 }
-export { type AgentConfig as A, type DataMessageHandler as D, Embedder as E, type LLMPlugin as L, type Message as M, type PipelineOptions as P, type RespondMode as R, type STTStream as S, type TranscriptionResult as T, type AgentStartOptions as a, type AgentState as b, type AgentEvents as c, AudioOutput as d, type LLMChatOptions as e, type LLMChunk as f, type MemoryConfig as g, type PipelineEvents as h, type STTPlugin as i, type STTStreamOptions as j, type TTSPlugin as k, RoomMemory as l, type RoomMemoryConfig as m };
+export { type AgentConfig as A, type DataMessageHandler as D, Embedder as E, type LLMPlugin as L, type Message as M, type PipelineOptions as P, type RespondMode as R, type STTStream as S, type TranscriptionResult as T, type AgentStartOptions as a, type AgentState as b, type AgentEvents as c, AudioOutput as d, type LLMChatOptions as e, type LLMChunk as f, type MemoryConfig as g, type PipelineEvents as h, type STTPlugin as i, type STTStreamOptions as j, type TTSPlugin as k, type ToolCallResult as l, type ToolDefinition as m, RoomMemory as n, type RoomMemoryConfig as o };

package/dist/{types-BBKtiPvm.d.ts → types-BJylZd8Q.d.ts} RENAMED Viewed

@@ -85,6 +85,9 @@ declare class AudioOutput {
     private _responding;
     private _stopped;
     private silenceInterval;
+    /** Resolves when the RTP transport is ready and initial silence has been sent. */
+    readonly whenReady: Promise<void>;
+    private _resolveReady?;
     /** When set, raw PCM from TTS is saved to this directory as WAV files for debugging. */
     dumpDir: string | null;
     private dumpCounter;
@@ -164,6 +167,19 @@ interface Message {
     role: 'system' | 'user' | 'assistant';
     content: string;
 }
+interface ToolDefinition {
+    type: 'function';
+    function: {
+        name: string;
+        description: string;
+        parameters: Record<string, unknown>;
+    };
+}
+interface ToolCallResult {
+    id: string;
+    name: string;
+    arguments: string;
+}
 interface LLMChunk {
     type: 'token' | 'segment' | 'tool_call' | 'done';
     token?: string;
@@ -171,10 +187,7 @@ interface LLMChunk {
         lang: string;
         text: string;
     };
-    toolCall?: {
-        name: string;
-        arguments: string;
-    };
+    toolCall?: ToolCallResult;
     usage?: {
         promptTokens: number;
         completionTokens: number;
@@ -183,6 +196,8 @@ interface LLMChunk {
 interface LLMChatOptions {
     /** Skip structured output (responseFormat) for this call — return plain text tokens. */
     plainText?: boolean;
+    /** Tool definitions to pass to the LLM for function calling. */
+    tools?: ToolDefinition[];
 }
 interface LLMPlugin {
     chat(messages: Message[], signal?: AbortSignal, options?: LLMChatOptions): AsyncGenerator<LLMChunk>;
@@ -226,6 +241,8 @@ interface AgentConfig {
     memory?: MemoryConfig;
     /** Max context tokens before triggering summarization (default: 5000) */
     maxContextTokens?: number;
+    /** Tool definitions for LLM function calling. */
+    tools?: ToolDefinition[];
 }
 interface AgentStartOptions {
     room: string;
@@ -260,6 +277,8 @@ interface PipelineOptions {
     memory?: RoomMemory;
     /** Max context tokens before triggering summarization (default: 5000) */
     maxContextTokens?: number;
+    /** Tool definitions for LLM function calling. */
+    tools?: ToolDefinition[];
 }
 type AgentState = 'idle' | 'listening' | 'thinking' | 'speaking';
 interface AgentEvents {
@@ -272,6 +291,8 @@ interface AgentEvents {
     response: (text: string) => void;
     /** Agent state: idle → listening (STT active) → thinking (LLM) → speaking (audio) → idle. */
     agentState: (state: AgentState) => void;
+    /** Emitted when the LLM invokes a tool. */
+    toolCall: (toolCall: ToolCallResult) => void;
     error: (error: Error) => void;
     connected: () => void;
     disconnected: (reason?: string) => void;
@@ -283,7 +304,9 @@ interface PipelineEvents {
     sentence: (text: string) => void;
     response: (text: string) => void;
     agentState: (state: AgentState) => void;
+    /** Emitted when the LLM invokes a tool. */
+    toolCall: (toolCall: ToolCallResult) => void;
     error: (error: Error) => void;
 }
-export { type AgentConfig as A, type DataMessageHandler as D, Embedder as E, type LLMPlugin as L, type Message as M, type PipelineOptions as P, type RespondMode as R, type STTStream as S, type TranscriptionResult as T, type AgentStartOptions as a, type AgentState as b, type AgentEvents as c, AudioOutput as d, type LLMChatOptions as e, type LLMChunk as f, type MemoryConfig as g, type PipelineEvents as h, type STTPlugin as i, type STTStreamOptions as j, type TTSPlugin as k, RoomMemory as l, type RoomMemoryConfig as m };
+export { type AgentConfig as A, type DataMessageHandler as D, Embedder as E, type LLMPlugin as L, type Message as M, type PipelineOptions as P, type RespondMode as R, type STTStream as S, type TranscriptionResult as T, type AgentStartOptions as a, type AgentState as b, type AgentEvents as c, AudioOutput as d, type LLMChatOptions as e, type LLMChunk as f, type MemoryConfig as g, type PipelineEvents as h, type STTPlugin as i, type STTStreamOptions as j, type TTSPlugin as k, type ToolCallResult as l, type ToolDefinition as m, RoomMemory as n, type RoomMemoryConfig as o };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@dtelecom/agents-js",
-  "version": "0.2.2",
+  "version": "0.3.1",
   "description": "AI voice agent framework for dTelecom rooms",
   "main": "./dist/index.js",
   "module": "./dist/index.mjs",